diff --git "a/wandb/run-20220317_164114-2vzd8l55/files/output.log" "b/wandb/run-20220317_164114-2vzd8l55/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20220317_164114-2vzd8l55/files/output.log" @@ -0,0 +1,10246 @@ + + + 0%| | 0/17840 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:20,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:22,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.5557, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:24,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 1/17840 [00:08<43:41:14, 8.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:26,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:28,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:30,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.7327, 'learning_rate': 1.0000000000000001e-07, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:32,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 2/17840 [00:16<41:35:54, 8.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:34,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:36,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:38,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.6364, 'learning_rate': 2.0000000000000002e-07, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:40,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 3/17840 [00:24<39:59:47, 8.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:41,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:43,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:45,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.6572, 'learning_rate': 3.0000000000000004e-07, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:47,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 4/17840 [00:32<38:47:05, 7.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:49,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:51,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:53,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4952, 'learning_rate': 4.0000000000000003e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 5/17840 [00:39<37:59:46, 7.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:41:56,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:41:58,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:00,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4896, 'learning_rate': 5.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:02,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 6/17840 [00:46<37:35:23, 7.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:04,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:06,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:07,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:09,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 7/17840 [00:54<37:13:02, 7.51s/it] + + 0%| | 7/17840 [00:54<37:13:02, 7.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:11,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:13,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:15,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.346, 'learning_rate': 7.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:17,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 8/17840 [01:01<37:00:30, 7.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:19,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:20,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:22,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.5115, 'learning_rate': 8.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:24,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 9/17840 [01:08<36:43:49, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:26,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:28,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:29,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.434, 'learning_rate': 9e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:31,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 10/17840 [01:16<36:32:13, 7.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:33,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:35,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:37,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4992, 'learning_rate': 1.0000000000000002e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:38,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 11/17840 [01:23<36:13:14, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:40,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:42,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:44,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:45,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 12/17840 [01:30<36:00:16, 7.27s/it] + + 0%| | 12/17840 [01:30<36:00:16, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:47,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:49,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:51,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3491, 'learning_rate': 1.2000000000000002e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:53,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 13/17840 [01:37<35:42:05, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:42:54,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:56,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:42:58,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:00,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 14/17840 [01:44<35:31:05, 7.17s/it] + + 0%| | 14/17840 [01:44<35:31:05, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:02,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:03,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.278, 'learning_rate': 1.4000000000000001e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:07,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 15/17840 [01:51<35:12:21, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:08,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:10,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:12,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3575, 'learning_rate': 1.5e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:14,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 16/17840 [01:58<34:55:34, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:15,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:17,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:19,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:21,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 17/17840 [02:05<34:45:35, 7.02s/it] + + 0%| | 17/17840 [02:05<34:45:35, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:22,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:24,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:26,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4326, 'learning_rate': 1.6000000000000001e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:27,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 18/17840 [02:12<34:22:45, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:29,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:31,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:32,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:34,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 19/17840 [02:19<34:10:30, 6.90s/it] + + 0%| | 19/17840 [02:19<34:10:30, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:36,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:38,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:39,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:41,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 20/17840 [02:25<34:04:23, 6.88s/it] + + 0%| | 20/17840 [02:25<34:04:23, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:43,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:44,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:46,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1842, 'learning_rate': 1.9e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:48,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 21/17840 [02:32<33:45:51, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:49,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:51,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:53,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:54,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 22/17840 [02:39<33:36:41, 6.79s/it] + 0%| | 22/17840 [02:39<33:36:41, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:43:56,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:58,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:43:59,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:01,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 23/17840 [02:45<33:16:28, 6.72s/it] + + 0%| | 23/17840 [02:45<33:16:28, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:03,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:04,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:06,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:07,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 24/17840 [02:52<32:58:50, 6.66s/it] + + 0%| | 24/17840 [02:52<32:58:50, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:09,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:11,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:12,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.129, 'learning_rate': 2.3e-06, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:16,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 25/17840 [03:01<35:57:54, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:18,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:19,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:21,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.234, 'learning_rate': 2.4000000000000003e-06, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:23,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 26/17840 [03:07<34:47:48, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:24,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:26,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:27,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:24,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:27,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:24,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:13<33:50:21, 6.84s/it]g-point operations will not be computed-17 16:44:24,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:13<33:50:21, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:31,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:34,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:31,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:20<33:12:41, 6.71s/it]g-point operations will not be computed-17 16:44:31,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:20<33:12:41, 6.71s/it]g-point operations will not be computed-17 16:44:31,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:20<33:12:41, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:37,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:20<33:12:41, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:37,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:26<32:47:12, 6.63s/it]g-point operations will not be computed-17 16:44:37,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:26<32:47:12, 6.63s/it]g-point operations will not be computed-17 16:44:37,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:26<32:47:12, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:43,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:26<32:47:12, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:43,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:33<32:21:51, 6.54s/it]g-point operations will not be computed-17 16:44:43,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:33<32:21:51, 6.54s/it]g-point operations will not be computed-17 16:44:43,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:33<32:21:51, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:50,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:33<32:21:51, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:50,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:53,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:50,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:53,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:50,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:39<31:59:12, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:39<31:59:12, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:44:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:59,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:44:59,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:44:56,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:45<31:25:09, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:02,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:45<31:25:09, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:02,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:05,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:02,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:05,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:02,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:51<31:10:29, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:08,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:51<31:10:29, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:08,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:11,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:08,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:11,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:08,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [03:57<30:34:32, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:14,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [03:57<30:34:32, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:14,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [04:03<29:55:51, 6.05s/it]g-point operations will not be computed-17 16:45:14,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [04:03<29:55:51, 6.05s/it]g-point operations will not be computed-17 16:45:14,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [04:03<29:55:51, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:20,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:23,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:20,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:09<29:19:28, 5.93s/it]g-point operations will not be computed-17 16:45:20,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:09<29:19:28, 5.93s/it]g-point operations will not be computed-17 16:45:20,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:09<29:19:28, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:25,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:28,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:25,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:28,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:25,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:14<28:46:10, 5.82s/it]g-point operations will not be computed-17 16:45:25,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:14<28:46:10, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:31,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:34,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:31,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:34,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:31,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [04:20<28:11:00, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:36,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:39,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:36,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:25<27:36:49, 5.58s/it]g-point operations will not be computed-17 16:45:36,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:25<27:36:49, 5.58s/it]g-point operations will not be computed-17 16:45:36,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:25<27:36:49, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:42,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:44,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:42,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:44,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:42,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:30<27:02:59, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:47,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:30<27:02:59, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:47,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:35<26:15:17, 5.31s/it]g-point operations will not be computed-17 16:45:47,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:35<26:15:17, 5.31s/it]g-point operations will not be computed-17 16:45:47,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:35<26:15:17, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:52,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 42/17840 [04:40<25:18:15, 5.12s/it]g-point operations will not be computed-17 16:45:52,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 42/17840 [04:40<25:18:15, 5.12s/it]g-point operations will not be computed-17 16:45:52,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 42/17840 [04:40<25:18:15, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:45:56,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:58,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:56,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:45:58,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:45:56,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 43/17840 [04:44<24:06:07, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:01,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:48<22:45:30, 4.60s/it]g-point operations will not be computed-17 16:46:01,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:48<22:45:30, 4.60s/it]g-point operations will not be computed-17 16:46:01,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:48<22:45:30, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:04,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 45/17840 [04:51<21:08:21, 4.28s/it]g-point operations will not be computed-17 16:46:04,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 45/17840 [04:51<21:08:21, 4.28s/it]g-point operations will not be computed-17 16:46:04,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:09,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:08,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:09,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:08,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:55<19:29:20, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:11,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 47/17840 [04:57<17:52:12, 3.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:14,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 47/17840 [04:57<17:52:12, 3.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:14,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 48/17840 [05:00<16:14:54, 3.29s/it]g-point operations will not be computed-17 16:46:14,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 48/17840 [05:00<16:14:54, 3.29s/it]g-point operations will not be computed-17 16:46:14,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 49/17840 [05:02<14:40:46, 2.97s/it]g-point operations will not be computed-17 16:46:16,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 49/17840 [05:02<14:40:46, 2.97s/it]g-point operations will not be computed-17 16:46:16,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:19,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:18,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [05:06<16:18:58, 3.30s/it]g-point operations will not be computed-17 16:46:18,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [05:06<16:18:58, 3.30s/it]g-point operations will not be computed-17 16:46:18,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [05:06<16:18:58, 3.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:24,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [05:06<16:18:58, 3.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:24,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:28,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:24,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:14<22:55:50, 4.64s/it]g-point operations will not be computed-17 16:46:24,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:14<22:55:50, 4.64s/it]g-point operations will not be computed-17 16:46:24,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:14<22:55:50, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:31,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:14<22:55:50, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:31,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:35,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:31,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:22<27:07:40, 5.49s/it]g-point operations will not be computed-17 16:46:31,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:22<27:07:40, 5.49s/it]g-point operations will not be computed-17 16:46:31,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:22<27:07:40, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:39,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:22<27:07:40, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:39,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:43,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:39,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:29<30:10:40, 6.11s/it]g-point operations will not be computed-17 16:46:39,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:29<30:10:40, 6.11s/it]g-point operations will not be computed-17 16:46:39,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:29<30:10:40, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:46,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:50,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:46,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:36<32:02:06, 6.48s/it]g-point operations will not be computed-17 16:46:46,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:36<32:02:06, 6.48s/it]g-point operations will not be computed-17 16:46:46,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:36<32:02:06, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:54,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:36<32:02:06, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:46:54,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:46:57,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:46:54,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:44<33:20:22, 6.75s/it]g-point operations will not be computed-17 16:46:54,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:44<33:20:22, 6.75s/it]g-point operations will not be computed-17 16:46:54,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:44<33:20:22, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:01,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:05,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:01,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:05,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:01,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:51<34:15:26, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:51<34:15:26, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:12,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:58<34:42:49, 7.03s/it]g-point operations will not be computed-17 16:47:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:58<34:42:49, 7.03s/it]g-point operations will not be computed-17 16:47:09,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:58<34:42:49, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:16,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:58<34:42:49, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:16,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:19,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:16,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:19,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:16,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [06:06<35:02:11, 7.09s/it]g-point operations will not be computed-17 16:47:16,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [06:06<35:02:11, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:23,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:26,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:23,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:13<35:03:00, 7.10s/it]g-point operations will not be computed-17 16:47:23,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:13<35:03:00, 7.10s/it]g-point operations will not be computed-17 16:47:23,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:13<35:03:00, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:30,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:13<35:03:00, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:30,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:34,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:30,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:20<35:09:53, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:37,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:20<35:09:53, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:37,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5546, 'learning_rate': 5.7000000000000005e-06, 'epoch': 0.07} +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:41,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:37,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:41,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:37,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:27<35:08:16, 7.11s/it]g-point operations will not be computed-17 16:47:37,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:27<35:08:16, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:44,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:27<35:08:16, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:44,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:48,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:44,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:48,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:44,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:34<35:06:01, 7.11s/it]g-point operations will not be computed-17 16:47:44,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:34<35:06:01, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:51,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:55,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:51,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:47:55,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:47:51,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:41<34:52:30, 7.06s/it]g-point operations will not be computed-17 16:47:51,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:41<34:52:30, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:58,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:41<34:52:30, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:58,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:41<34:52:30, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:47:58,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:48<34:39:43, 7.02s/it]g-point operations will not be computed-17 16:47:58,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:48<34:39:43, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:05,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:48<34:39:43, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:05,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:09,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:05,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:09,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:05,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:55<34:27:00, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:12,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:55<34:27:00, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:12,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:15,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:12,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:15,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:12,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [07:02<34:13:49, 6.93s/it]g-point operations will not be computed-17 16:48:12,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [07:02<34:13:49, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:19,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [07:02<34:13:49, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:19,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:22,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:19,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:22,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:19,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [07:09<34:05:38, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:26,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [07:09<34:05:38, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:26,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:29,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:26,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:29,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:26,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:15<33:52:54, 6.86s/it]g-point operations will not be computed-17 16:48:26,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:15<33:52:54, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:33,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:36,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:33,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:36,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:33,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:22<33:48:24, 6.85s/it]g-point operations will not be computed-17 16:48:33,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:22<33:48:24, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:39,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:22<33:48:24, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:39,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:29<33:36:29, 6.81s/it]g-point operations will not be computed-17 16:48:39,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:29<33:36:29, 6.81s/it]g-point operations will not be computed-17 16:48:39,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:29<33:36:29, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:46,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:29<33:36:29, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:46,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:49,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:46,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:49,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:46,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:36<33:24:28, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:53,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:36<33:24:28, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:53,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:56,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:53,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:48:56,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:53,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:42<33:15:06, 6.74s/it]g-point operations will not be computed-17 16:48:53,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:42<33:15:06, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:48:59,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:03,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:48:59,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:49<32:57:29, 6.68s/it]g-point operations will not be computed-17 16:48:59,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:49<32:57:29, 6.68s/it]g-point operations will not be computed-17 16:48:59,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:49<32:57:29, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:06,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:09,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:06,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:55<32:50:21, 6.65s/it]g-point operations will not be computed-17 16:49:06,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:55<32:50:21, 6.65s/it]g-point operations will not be computed-17 16:49:06,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:55<32:50:21, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:13,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:55<32:50:21, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:13,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:16,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:13,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [08:04<35:57:47, 7.29s/it]g-point operations will not be computed-17 16:49:13,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [08:04<35:57:47, 7.29s/it]g-point operations will not be computed-17 16:49:13,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [08:04<35:57:47, 7.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:21,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [08:04<35:57:47, 7.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:21,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:25,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:21,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:25,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:21,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [08:11<34:48:58, 7.06s/it]g-point operations will not be computed-17 16:49:21,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [08:11<34:48:58, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:28,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:31,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:28,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:17<33:56:49, 6.88s/it]g-point operations will not be computed-17 16:49:28,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:17<33:56:49, 6.88s/it]g-point operations will not be computed-17 16:49:28,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:17<33:56:49, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:37,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:23<33:07:26, 6.71s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:23<33:07:26, 6.71s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:42,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:42,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:30<32:28:54, 6.58s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:30<32:28:54, 6.58s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3798, 'learning_rate': 7.6e-06, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:50,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:36<31:52:06, 6.46s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:36<31:52:06, 6.46s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5643, 'learning_rate': 7.7e-06, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-17 16:49:56,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:42<31:23:01, 6.36s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:42<31:23:01, 6.36s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:01,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:01,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:48<31:09:16, 6.32s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:48<31:09:16, 6.32s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4375, 'learning_rate': 7.9e-06, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:08,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [08:54<30:50:17, 6.25s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [08:54<30:50:17, 6.25s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6365, 'learning_rate': 8.000000000000001e-06, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:14,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 84/17840 [09:00<30:18:48, 6.15s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 84/17840 [09:00<30:18:48, 6.15s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:19,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:19,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:19,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|�� | 85/17840 [09:06<29:44:24, 6.03s/it]g-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:24,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:27,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:27,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4775, 'learning_rate': 8.3e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:27,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:33,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:33,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:35,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:35,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:35,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:49:34,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 88/17840 [09:23<28:03:24, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:39,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 88/17840 [09:23<28:03:24, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:39,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:43,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:43,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5192, 'learning_rate': 8.599999999999999e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:47,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:39,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 90/17840 [09:33<26:51:22, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:50,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 90/17840 [09:33<26:51:22, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:50,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4474, 'learning_rate': 8.7e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:53,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:50,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:53,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:50,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6787, 'learning_rate': 8.8e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:57,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:50,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:50:57,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:50,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 92/17840 [09:42<24:52:38, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:50:59,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:01,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:59,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:01,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:50:59,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 93/17840 [09:47<23:41:56, 4.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:03,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 94/17840 [09:51<22:26:53, 4.55s/it]g-point operations will not be computed-17 16:51:03,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 94/17840 [09:51<22:26:53, 4.55s/it]g-point operations will not be computed-17 16:51:03,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 94/17840 [09:51<22:26:53, 4.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:07,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 95/17840 [09:54<21:15:40, 4.31s/it]g-point operations will not be computed-17 16:51:07,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 95/17840 [09:54<21:15:40, 4.31s/it]g-point operations will not be computed-17 16:51:07,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 95/17840 [09:54<21:15:40, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:11,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 96/17840 [09:58<19:56:45, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:14,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 96/17840 [09:58<19:56:45, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:14,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:16,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:14,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:16,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:14,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 97/17840 [10:01<18:24:18, 3.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:17,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 98/17840 [10:03<16:52:10, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:20,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 98/17840 [10:03<16:52:10, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:20,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 99/17840 [10:06<15:14:57, 3.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:22,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 99/17840 [10:06<15:14:57, 3.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:22,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:23,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:22,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [10:10<16:33:13, 3.36s/it]g-point operations will not be computed-17 16:51:22,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [10:10<16:33:13, 3.36s/it]g-point operations will not be computed-17 16:51:22,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [10:10<16:33:13, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:28,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [10:10<16:33:13, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:28,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:31,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:28,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [10:18<23:26:05, 4.76s/it]g-point operations will not be computed-17 16:51:28,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [10:18<23:26:05, 4.76s/it]g-point operations will not be computed-17 16:51:28,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [10:18<23:26:05, 4.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [10:18<23:26:05, 4.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [10:18<23:26:05, 4.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 102/17840 [10:25<27:42:01, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 102/17840 [10:25<27:42:01, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3833, 'learning_rate': 9.900000000000002e-06, 'epoch': 0.11} + 1%|▍ | 102/17840 [10:25<27:42:01, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:48,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:48,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5521, 'learning_rate': 1e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:48,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:48,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:51:48,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [10:40<32:26:01, 6.58s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [10:40<32:26:01, 6.58s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [10:40<32:26:01, 6.58s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [10:40<32:26:01, 6.58s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [10:40<32:26:01, 6.58s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:48<33:37:34, 6.83s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:48<33:37:34, 6.83s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:09,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [10:55<34:17:33, 6.96s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [10:55<34:17:33, 6.96s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5175, 'learning_rate': 1.03e-05, 'epoch': 0.12} + 1%|▍ | 106/17840 [10:55<34:17:33, 6.96s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [10:55<34:17:33, 6.96s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [10:55<34:17:33, 6.96s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [11:02<34:40:50, 7.04s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [11:02<34:40:50, 7.04s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:23,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [11:10<35:00:27, 7.11s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [11:10<35:00:27, 7.11s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6291, 'learning_rate': 1.05e-05, 'epoch': 0.12} + 1%|▍ | 108/17840 [11:10<35:00:27, 7.11s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [11:10<35:00:27, 7.11s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [11:10<35:00:27, 7.11s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [11:17<35:10:18, 7.14s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [11:17<35:10:18, 7.14s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [11:17<35:10:18, 7.14s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:39,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:39,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3494, 'learning_rate': 1.0700000000000001e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:39,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:39,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:39,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 111/17840 [11:31<35:06:01, 7.13s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 111/17840 [11:31<35:06:01, 7.13s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:52:52,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:38<34:57:09, 7.10s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:38<34:57:09, 7.10s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3961, 'learning_rate': 1.09e-05, 'epoch': 0.13} + 1%|▍ | 112/17840 [11:38<34:57:09, 7.10s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:38<34:57:09, 7.10s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:38<34:57:09, 7.10s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 113/17840 [11:45<34:46:10, 7.06s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:04,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:04,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [11:52<34:42:31, 7.05s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [11:52<34:42:31, 7.05s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3281, 'learning_rate': 1.11e-05, 'epoch': 0.13} + 1%|▍ | 114/17840 [11:52<34:42:31, 7.05s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:14,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:14,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3881, 'learning_rate': 1.1200000000000001e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:14,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:14,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:14,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 116/17840 [12:06<34:13:45, 6.95s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:25,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:25,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [12:13<33:59:22, 6.90s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [12:13<33:59:22, 6.90s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4443, 'learning_rate': 1.1400000000000001e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:33,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [12:19<33:43:36, 6.85s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [12:19<33:43:36, 6.85s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3055, 'learning_rate': 1.1500000000000002e-05, 'epoch': 0.13} + 1%|▌ | 118/17840 [12:19<33:43:36, 6.85s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [12:19<33:43:36, 6.85s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [12:19<33:43:36, 6.85s/it]g-point operations will not be computed-17 16:51:35,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [12:26<33:28:07, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [12:26<33:28:07, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [12:26<33:28:07, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [12:33<33:22:05, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [12:33<33:22:05, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5342, 'learning_rate': 1.1700000000000001e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 16:53:53,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 121/17840 [12:39<33:15:05, 6.76s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 121/17840 [12:39<33:15:05, 6.76s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4666, 'learning_rate': 1.18e-05, 'epoch': 0.14} + 1%|▌ | 121/17840 [12:39<33:15:05, 6.76s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:02,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:02,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3724, 'learning_rate': 1.19e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:02,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:02,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [12:53<32:51:29, 6.68s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [12:53<32:51:29, 6.68s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:12,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:12,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [12:59<32:40:48, 6.64s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [12:59<32:40:48, 6.64s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5247, 'learning_rate': 1.2100000000000001e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:20,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [13:08<36:04:16, 7.33s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [13:08<36:04:16, 7.33s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4356, 'learning_rate': 1.22e-05, 'epoch': 0.14} + 1%|▌ | 125/17840 [13:08<36:04:16, 7.33s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [13:08<36:04:16, 7.33s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [13:08<36:04:16, 7.33s/it]g-point operations will not be computed-17 16:53:43,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [13:15<34:54:38, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:32,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [13:15<34:54:38, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:32,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [13:15<34:54:38, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:32,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [13:21<34:01:51, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [13:21<34:01:51, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5675, 'learning_rate': 1.24e-05, 'epoch': 0.14} + 1%|▌ | 127/17840 [13:21<34:01:51, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 128/17840 [13:28<33:10:01, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 128/17840 [13:28<33:10:01, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 129/17840 [13:34<32:24:50, 6.59s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 129/17840 [13:34<32:24:50, 6.59s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:52,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:52,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 130/17840 [13:40<31:52:41, 6.48s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 130/17840 [13:40<31:52:41, 6.48s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:59,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:54:59,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:46<31:27:42, 6.40s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:46<31:27:42, 6.40s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:05,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:05,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [13:52<31:03:52, 6.32s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [13:52<31:03:52, 6.32s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:11,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:11,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 133/17840 [13:58<30:28:05, 6.19s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 133/17840 [13:58<30:28:05, 6.19s/it]g-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:17,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:17,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:17,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:54:38,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 134/17840 [14:04<29:49:14, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 134/17840 [14:04<29:49:14, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:25,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:25,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3198, 'learning_rate': 1.32e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:29,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 136/17840 [14:15<28:42:30, 5.84s/it]g-point operations will not be computed-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 136/17840 [14:15<28:42:30, 5.84s/it]g-point operations will not be computed-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:34,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:34,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:21,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 137/17840 [14:21<28:12:18, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 137/17840 [14:21<28:12:18, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.706, 'learning_rate': 1.3400000000000002e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:42,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:42,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4342, 'learning_rate': 1.3500000000000001e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:45,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 139/17840 [14:31<26:56:12, 5.48s/it]g-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 139/17840 [14:31<26:56:12, 5.48s/it]g-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:49,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:52,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:52,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:54,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:56,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:56,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:56,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:55:59,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:55:38,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 142/17840 [14:45<23:47:00, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:02,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 142/17840 [14:45<23:47:00, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:02,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:03,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:02,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:03,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:02,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 143/17840 [14:49<22:24:46, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:05,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 144/17840 [14:52<20:55:47, 4.26s/it]g-point operations will not be computed-17 16:56:05,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 144/17840 [14:52<20:55:47, 4.26s/it]g-point operations will not be computed-17 16:56:05,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 144/17840 [14:52<20:55:47, 4.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:09,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 144/17840 [14:52<20:55:47, 4.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:09,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 145/17840 [14:56<19:40:08, 4.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:12,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:14,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:12,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:14,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:12,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 146/17840 [14:59<18:22:18, 3.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:15,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 146/17840 [14:59<18:22:18, 3.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:15,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 147/17840 [15:02<17:05:38, 3.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:18,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 147/17840 [15:02<17:05:38, 3.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:18,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 148/17840 [15:04<15:48:08, 3.22s/it]g-point operations will not be computed-17 16:56:18,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 148/17840 [15:04<15:48:08, 3.22s/it]g-point operations will not be computed-17 16:56:18,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 149/17840 [15:07<14:31:25, 2.96s/it]g-point operations will not be computed-17 16:56:21,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:24,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:23,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:24,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:23,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 150/17840 [15:11<15:59:35, 3.25s/it]g-point operations will not be computed-17 16:56:23,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 150/17840 [15:11<15:59:35, 3.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:28,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 150/17840 [15:11<15:59:35, 3.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:28,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:32,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:28,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:32,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:28,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 151/17840 [15:19<22:44:07, 4.63s/it]g-point operations will not be computed-17 16:56:28,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 151/17840 [15:19<22:44:07, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 151/17840 [15:19<22:44:07, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:40,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:40,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 152/17840 [15:26<26:57:25, 5.49s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 152/17840 [15:26<26:57:25, 5.49s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 152/17840 [15:26<26:57:25, 5.49s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 152/17840 [15:26<26:57:25, 5.49s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:49,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:49,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:49,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:49,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:56:49,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:41<31:39:28, 6.44s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:41<31:39:28, 6.44s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:41<31:39:28, 6.44s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:41<31:39:28, 6.44s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 154/17840 [15:41<31:39:28, 6.44s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [15:48<32:56:54, 6.71s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:07,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:07,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:07,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:55<33:36:05, 6.84s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:55<33:36:05, 6.84s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:55<33:36:05, 6.84s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:55<33:36:05, 6.84s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:55<33:36:05, 6.84s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [16:03<34:08:42, 6.95s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:22,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:22,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:22,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:10<34:26:42, 7.01s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:10<34:26:42, 7.01s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:10<34:26:42, 7.01s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:10<34:26:42, 7.01s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [16:10<34:26:42, 7.01s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 159/17840 [16:17<34:37:35, 7.05s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:36,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:36,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [16:24<34:37:58, 7.05s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [16:24<34:37:58, 7.05s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3259, 'learning_rate': 1.5700000000000002e-05, 'epoch': 0.18} + 1%|▋ | 160/17840 [16:24<34:37:58, 7.05s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:46,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:46,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3384, 'learning_rate': 1.58e-05, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:46,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:46,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:46,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:38<34:21:30, 7.00s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:57,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:57:57,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:45<34:14:08, 6.97s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:45<34:14:08, 6.97s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3544, 'learning_rate': 1.6000000000000003e-05, 'epoch': 0.18} + 1%|▋ | 163/17840 [16:45<34:14:08, 6.97s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:45<34:14:08, 6.97s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:45<34:14:08, 6.97s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:52<34:10:08, 6.96s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:11,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:11,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 165/17840 [16:58<33:56:56, 6.91s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 165/17840 [16:58<33:56:56, 6.91s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.39, 'learning_rate': 1.62e-05, 'epoch': 0.18} + 1%|▋ | 165/17840 [16:58<33:56:56, 6.91s/it]g-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:21,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:21,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.424, 'learning_rate': 1.63e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:21,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:21,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:21,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:56:36,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [17:12<33:31:54, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [17:12<33:31:54, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [17:12<33:31:54, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [17:19<33:33:48, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [17:19<33:33:48, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1713, 'learning_rate': 1.65e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:39,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 169/17840 [17:25<33:21:32, 6.80s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 169/17840 [17:25<33:21:32, 6.80s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1893, 'learning_rate': 1.66e-05, 'epoch': 0.19} + 1%|▋ | 169/17840 [17:25<33:21:32, 6.80s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:48,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:48,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3378, 'learning_rate': 1.6700000000000003e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:48,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:48,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:39<33:02:20, 6.73s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:39<33:02:20, 6.73s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:58,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:58:58,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 172/17840 [17:45<32:57:05, 6.71s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 172/17840 [17:45<32:57:05, 6.71s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4631, 'learning_rate': 1.69e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:06,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [17:52<32:42:52, 6.67s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [17:52<32:42:52, 6.67s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4085, 'learning_rate': 1.7000000000000003e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:12,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [17:59<32:28:04, 6.62s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [17:59<32:28:04, 6.62s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2214, 'learning_rate': 1.7100000000000002e-05, 'epoch': 0.2} + 1%|▋ | 174/17840 [17:59<32:28:04, 6.62s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [17:59<32:28:04, 6.62s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [17:59<32:28:04, 6.62s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [17:59<32:28:04, 6.62s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [17:59<32:28:04, 6.62s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:26,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:26,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [18:14<34:20:25, 7.00s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [18:14<34:20:25, 7.00s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:32,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:32,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [18:20<33:18:25, 6.79s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [18:20<33:18:25, 6.79s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:39,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:39,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 178/17840 [18:26<32:32:09, 6.63s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 178/17840 [18:26<32:32:09, 6.63s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3112, 'learning_rate': 1.75e-05, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:46,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [18:32<31:46:07, 6.48s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [18:32<31:46:07, 6.48s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.431, 'learning_rate': 1.76e-05, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:52,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 180/17840 [18:38<31:17:49, 6.38s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 180/17840 [18:38<31:17:49, 6.38s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:57,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:59:57,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 181/17840 [18:45<30:51:52, 6.29s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 181/17840 [18:45<30:51:52, 6.29s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:03,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:03,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [18:51<30:34:54, 6.23s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [18:51<30:34:54, 6.23s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:09,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:09,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 183/17840 [18:57<30:02:13, 6.12s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 183/17840 [18:57<30:02:13, 6.12s/it]g-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:15,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:15,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:58:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 184/17840 [19:02<29:34:13, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 184/17840 [19:02<29:34:13, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4065, 'learning_rate': 1.81e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:23,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:23,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.428, 'learning_rate': 1.8200000000000002e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:28,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:28,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 186/17840 [19:14<28:30:18, 5.81s/it]g-point operations will not be computed-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:32,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:32,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:32,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:19,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 187/17840 [19:19<27:58:32, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 187/17840 [19:19<27:58:32, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:40,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:40,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2166, 'learning_rate': 1.85e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:44,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:44,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 189/17840 [19:30<27:00:01, 5.51s/it]g-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:50,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:50,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4367, 'learning_rate': 1.87e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:54,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:00:54,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:36,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 191/17840 [19:40<25:40:15, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 191/17840 [19:40<25:40:15, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 191/17840 [19:40<25:40:15, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:00,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:02,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:04,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:04,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:06,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:06,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:08,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:10,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:10,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:12,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:13,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:13,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:15,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:15,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:18,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:20,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:20,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:22,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:22,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:24,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:27,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:27,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7641, 'learning_rate': 1.97e-05, 'epoch': 0.22} +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:31,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:31,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:35,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:35,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1663, 'learning_rate': 1.9800000000000004e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:38,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:38,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:38,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 202/17840 [20:27<27:13:28, 5.56s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 202/17840 [20:27<27:13:28, 5.56s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 202/17840 [20:27<27:13:28, 5.56s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 202/17840 [20:27<27:13:28, 5.56s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 202/17840 [20:27<27:13:28, 5.56s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 203/17840 [20:34<30:06:56, 6.15s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 203/17840 [20:34<30:06:56, 6.15s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:01:55,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:42<31:52:16, 6.51s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:42<31:52:16, 6.51s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1979, 'learning_rate': 2.01e-05, 'epoch': 0.23} + 1%|▊ | 204/17840 [20:42<31:52:16, 6.51s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:42<31:52:16, 6.51s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:42<31:52:16, 6.51s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [20:49<32:57:54, 6.73s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [20:49<32:57:54, 6.73s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 205/17840 [20:49<32:57:54, 6.73s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1892, 'learning_rate': 2.0300000000000002e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:12,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [21:03<34:21:55, 7.02s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [21:03<34:21:55, 7.02s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [21:03<34:21:55, 7.02s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [21:03<34:21:55, 7.02s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [21:03<34:21:55, 7.02s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 208/17840 [21:11<34:40:12, 7.08s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:30,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [21:18<34:41:49, 7.08s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [21:18<34:41:49, 7.08s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [21:18<34:41:49, 7.08s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [21:18<34:41:49, 7.08s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [21:18<34:41:49, 7.08s/it]g-point operations will not be computed-17 17:00:56,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [21:25<34:39:23, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [21:25<34:39:23, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [21:25<34:39:23, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [21:25<34:39:23, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [21:32<34:43:44, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [21:32<34:43:44, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [21:32<34:43:44, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:55,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:55,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3277, 'learning_rate': 2.09e-05, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:55,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:55,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:02:55,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 213/17840 [21:46<34:39:18, 7.08s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 213/17840 [21:46<34:39:18, 7.08s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 213/17840 [21:46<34:39:18, 7.08s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:09,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:09,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3635, 'learning_rate': 2.11e-05, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:09,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:09,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:09,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [22:00<34:14:00, 6.99s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:19,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:19,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [22:07<34:04:50, 6.96s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [22:07<34:04:50, 6.96s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3756, 'learning_rate': 2.13e-05, 'epoch': 0.24} + 1%|▉ | 216/17840 [22:07<34:04:50, 6.96s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:29,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:29,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3538, 'learning_rate': 2.1400000000000002e-05, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:29,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:29,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:29,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [22:21<33:53:53, 6.93s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:40,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:40,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 219/17840 [22:27<33:40:25, 6.88s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 219/17840 [22:27<33:40:25, 6.88s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.336, 'learning_rate': 2.16e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:48,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [22:34<33:30:30, 6.85s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [22:34<33:30:30, 6.85s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3172, 'learning_rate': 2.1700000000000002e-05, 'epoch': 0.25} + 1%|▉ | 220/17840 [22:34<33:30:30, 6.85s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:56,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:56,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.284, 'learning_rate': 2.18e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:56,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:03:56,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 222/17840 [22:48<33:13:54, 6.79s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 222/17840 [22:48<33:13:54, 6.79s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3756, 'learning_rate': 2.19e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:08,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [22:54<33:09:13, 6.77s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [22:54<33:09:13, 6.77s/it]g-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3964, 'learning_rate': 2.2000000000000003e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:15,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:15,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:02:42,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [23:01<32:54:30, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [23:01<32:54:30, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [23:01<32:54:30, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [23:10<35:59:31, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [23:10<35:59:31, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4015, 'learning_rate': 2.22e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:30,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [23:16<34:49:27, 7.12s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [23:16<34:49:27, 7.12s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5593, 'learning_rate': 2.23e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:37,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 227/17840 [23:23<33:45:36, 6.90s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 227/17840 [23:23<33:45:36, 6.90s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3346, 'learning_rate': 2.2400000000000002e-05, 'epoch': 0.25} + 1%|▉ | 227/17840 [23:23<33:45:36, 6.90s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:45,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:45,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2318, 'learning_rate': 2.25e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:45,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:51,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:51,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2598, 'learning_rate': 2.26e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:51,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:57,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:57,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2917, 'learning_rate': 2.2700000000000003e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:04:57,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:03,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:03,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2995, 'learning_rate': 2.2800000000000002e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:03,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:10,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:10,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3966, 'learning_rate': 2.29e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:10,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:15,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:15,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2922, 'learning_rate': 2.3000000000000003e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:20,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:20,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 234/17840 [24:06<29:51:53, 6.11s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 234/17840 [24:06<29:51:53, 6.11s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:26,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:26,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 235/17840 [24:12<29:26:57, 6.02s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:30,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:30,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:30,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 236/17840 [24:17<28:56:05, 5.92s/it]g-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:36,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:36,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:36,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:04:18,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 237/17840 [24:23<28:28:30, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:40,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 237/17840 [24:23<28:28:30, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:40,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 237/17840 [24:23<28:28:30, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:40,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:44,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:40,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:44,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:40,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:48,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:40,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:48,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:40,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 239/17840 [24:34<27:21:05, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:51,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 239/17840 [24:34<27:21:05, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:05:51,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:54,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:51,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:54,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:51,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4633, 'learning_rate': 2.37e-05, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:58,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:51,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:05:58,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:05:51,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 241/17840 [24:44<25:54:55, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:03,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:03,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 242/17840 [24:48<24:40:39, 5.05s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:06,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:06,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:08,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:10,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:10,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:12,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:14,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:14,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:15,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:19,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:19,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:20,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:20,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:23,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:23,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:24,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:26,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:26,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:28,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:30,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:30,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3115, 'learning_rate': 2.47e-05, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:34,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:34,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:34,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:38,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:38,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:42,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:42,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:42,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [25:30<26:59:58, 5.53s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [25:30<26:59:58, 5.53s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 252/17840 [25:30<26:59:58, 5.53s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:53,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:53,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1997, 'learning_rate': 2.5e-05, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:53,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:06:53,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [25:45<31:43:02, 6.49s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [25:45<31:43:02, 6.49s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3909, 'learning_rate': 2.51e-05, 'epoch': 0.28} + 1%|█ | 254/17840 [25:45<31:43:02, 6.49s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [25:45<31:43:02, 6.49s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [25:45<31:43:02, 6.49s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [25:52<32:51:06, 6.73s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:12,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:12,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [26:00<33:40:26, 6.89s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [26:00<33:40:26, 6.89s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.231, 'learning_rate': 2.5300000000000002e-05, 'epoch': 0.29} + 1%|█ | 256/17840 [26:00<33:40:26, 6.89s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [26:00<33:40:26, 6.89s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [26:00<33:40:26, 6.89s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [26:07<33:59:30, 6.96s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [26:07<33:59:30, 6.96s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [26:07<33:59:30, 6.96s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:29,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:29,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2382, 'learning_rate': 2.5500000000000003e-05, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:29,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:29,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:29,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [26:21<34:26:21, 7.05s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [26:21<34:26:21, 7.05s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:42,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [26:28<34:34:15, 7.08s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [26:28<34:34:15, 7.08s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3874, 'learning_rate': 2.57e-05, 'epoch': 0.29} + 1%|█ | 260/17840 [26:28<34:34:15, 7.08s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [26:28<34:34:15, 7.08s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [26:28<34:34:15, 7.08s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 261/17840 [26:35<34:28:39, 7.06s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:54,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:07:54,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [26:42<34:21:28, 7.04s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [26:42<34:21:28, 7.04s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1782, 'learning_rate': 2.5900000000000003e-05, 'epoch': 0.29} + 1%|█ | 262/17840 [26:42<34:21:28, 7.04s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [26:42<34:21:28, 7.04s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [26:42<34:21:28, 7.04s/it]g-point operations will not be computed-17 17:06:01,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [26:49<34:17:29, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [26:49<34:17:29, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [26:49<34:17:29, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [26:49<34:17:29, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 264/17840 [26:56<34:02:54, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 264/17840 [26:56<34:02:54, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:17,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [27:03<33:55:54, 6.95s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [27:03<33:55:54, 6.95s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3265, 'learning_rate': 2.6200000000000003e-05, 'epoch': 0.3} + 1%|█▏ | 265/17840 [27:03<33:55:54, 6.95s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [27:03<33:55:54, 6.95s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [27:03<33:55:54, 6.95s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [27:10<33:56:05, 6.95s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:29,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:29,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:29,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [27:17<33:47:06, 6.92s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [27:17<33:47:06, 6.92s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:37,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [27:24<33:39:49, 6.90s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [27:24<33:39:49, 6.90s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5252, 'learning_rate': 2.6500000000000004e-05, 'epoch': 0.3} + 2%|█▏ | 268/17840 [27:24<33:39:49, 6.90s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [27:24<33:39:49, 6.90s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [27:24<33:39:49, 6.90s/it]g-point operations will not be computed-17 17:08:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [27:30<33:24:48, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [27:30<33:24:48, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [27:30<33:24:48, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 270/17840 [27:37<33:22:39, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 270/17840 [27:37<33:22:39, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4708, 'learning_rate': 2.6700000000000002e-05, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-17 17:08:58,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [27:44<33:07:50, 6.79s/it]g-point operations will not be computed-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [27:44<33:07:50, 6.79s/it]g-point operations will not be computed-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0956, 'learning_rate': 2.6800000000000004e-05, 'epoch': 0.3} + 2%|█▏ | 271/17840 [27:44<33:07:50, 6.79s/it]g-point operations will not be computed-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [27:44<33:07:50, 6.79s/it]g-point operations will not be computed-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [27:44<33:07:50, 6.79s/it]g-point operations will not be computed-17 17:08:48,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 272/17840 [27:50<32:56:14, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 272/17840 [27:50<32:56:14, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 272/17840 [27:50<32:56:14, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 272/17840 [27:50<32:56:14, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 273/17840 [27:57<32:38:37, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:16,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:16,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 274/17840 [28:04<32:33:06, 6.67s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 274/17840 [28:04<32:33:06, 6.67s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1858, 'learning_rate': 2.7100000000000005e-05, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:24,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [28:13<35:56:37, 7.37s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [28:13<35:56:37, 7.37s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3989, 'learning_rate': 2.7200000000000004e-05, 'epoch': 0.31} + 2%|█▏ | 275/17840 [28:13<35:56:37, 7.37s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:35,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:35,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3199, 'learning_rate': 2.7300000000000003e-05, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:35,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:35,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:35,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 277/17840 [28:26<33:34:30, 6.88s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:44,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:44,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:44,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 278/17840 [28:32<32:47:41, 6.72s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:51,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:51,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 279/17840 [28:38<32:08:16, 6.59s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 279/17840 [28:38<32:08:16, 6.59s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:57,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:09:57,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 280/17840 [28:44<31:41:46, 6.50s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 280/17840 [28:44<31:41:46, 6.50s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4213, 'learning_rate': 2.7700000000000002e-05, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:05,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [28:51<31:24:03, 6.44s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [28:51<31:24:03, 6.44s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:09,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:09,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 282/17840 [28:57<30:54:23, 6.34s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 282/17840 [28:57<30:54:23, 6.34s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:15,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:15,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 283/17840 [29:03<30:21:44, 6.23s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 283/17840 [29:03<30:21:44, 6.23s/it]g-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:21,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:21,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:09:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [29:09<29:41:45, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [29:09<29:41:45, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3376, 'learning_rate': 2.8100000000000005e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:30,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:30,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:30,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3763, 'learning_rate': 2.8199999999999998e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:35,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:35,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2748, 'learning_rate': 2.83e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:40,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 287/17840 [29:25<28:02:58, 5.75s/it]g-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 287/17840 [29:25<28:02:58, 5.75s/it]g-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:44,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:44,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:26,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 288/17840 [29:31<27:31:44, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:10:48,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 288/17840 [29:31<27:31:44, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:10:48,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3855, 'learning_rate': 2.8499999999999998e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:51,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:48,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:51,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:48,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4502, 'learning_rate': 2.86e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:55,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:48,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:10:55,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:48,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 290/17840 [29:41<25:59:23, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:10:58,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:00,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:58,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:00,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:10:58,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 291/17840 [29:46<24:57:37, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 291/17840 [29:46<24:57:37, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 291/17840 [29:46<24:57:37, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:05,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:08,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:08,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:10,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:12,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:12,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:13,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:15,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:15,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:19,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:19,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:20,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:22,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:22,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:24,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:24,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:27,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:27,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:28,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:29,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:29,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:32,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:32,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:36,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:36,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:36,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:40,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:40,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:43,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:43,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:11:43,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:11:02,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [30:32<26:52:55, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [30:32<26:52:55, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [30:32<26:52:55, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [30:32<26:52:55, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [30:39<29:49:25, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [30:39<29:49:25, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [30:39<29:49:25, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [30:39<29:49:25, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [30:39<29:49:25, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [30:47<31:41:58, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [30:47<31:41:58, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [30:47<31:41:58, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [30:47<31:41:58, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [30:47<31:41:58, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:11:49,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [30:54<32:56:37, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [30:54<32:56:37, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [30:54<32:56:37, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [30:54<32:56:37, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [31:01<33:39:24, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [31:01<33:39:24, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [31:01<33:39:24, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [31:01<33:39:24, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [31:01<33:39:24, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:11,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [31:08<34:07:35, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [31:08<34:07:35, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [31:08<34:07:35, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [31:16<34:22:41, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [31:16<34:22:41, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3458, 'learning_rate': 3.05e-05, 'epoch': 0.35} + 2%|█▎ | 308/17840 [31:16<34:22:41, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:38,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:38,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2551, 'learning_rate': 3.06e-05, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:38,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:38,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:38,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [31:30<34:33:47, 7.10s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [31:30<34:33:47, 7.10s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [31:30<34:33:47, 7.10s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:52,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:52,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4772, 'learning_rate': 3.08e-05, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:52,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:52,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:12:52,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 312/17840 [31:44<34:14:22, 7.03s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 312/17840 [31:44<34:14:22, 7.03s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:05,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [31:51<34:09:41, 7.02s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [31:51<34:09:41, 7.02s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2806, 'learning_rate': 3.1e-05, 'epoch': 0.35} + 2%|█▎ | 313/17840 [31:51<34:09:41, 7.02s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [31:51<34:09:41, 7.02s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [31:51<34:09:41, 7.02s/it]g-point operations will not be computed-17 17:12:26,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [31:58<33:54:16, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [31:58<33:54:16, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [31:58<33:54:16, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [32:04<33:41:38, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [32:04<33:41:38, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1763, 'learning_rate': 3.12e-05, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:25,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [32:11<33:33:45, 6.89s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [32:11<33:33:45, 6.89s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3293, 'learning_rate': 3.13e-05, 'epoch': 0.35} + 2%|█▎ | 316/17840 [32:11<33:33:45, 6.89s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [32:11<33:33:45, 6.89s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [32:11<33:33:45, 6.89s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 317/17840 [32:18<33:22:20, 6.86s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:37,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:37,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 318/17840 [32:25<33:14:39, 6.83s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 318/17840 [32:25<33:14:39, 6.83s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2146, 'learning_rate': 3.15e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:45,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 319/17840 [32:32<33:11:24, 6.82s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 319/17840 [32:32<33:11:24, 6.82s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2978, 'learning_rate': 3.16e-05, 'epoch': 0.36} + 2%|█▎ | 319/17840 [32:32<33:11:24, 6.82s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:54,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:54,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2265, 'learning_rate': 3.1700000000000005e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:57,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:13:57,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 321/17840 [32:45<33:03:40, 6.79s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 321/17840 [32:45<33:03:40, 6.79s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3463, 'learning_rate': 3.18e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:06,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 322/17840 [32:52<32:52:02, 6.75s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 322/17840 [32:52<32:52:02, 6.75s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2771, 'learning_rate': 3.19e-05, 'epoch': 0.36} + 2%|█▎ | 322/17840 [32:52<32:52:02, 6.75s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:14,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:14,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1576, 'learning_rate': 3.2000000000000005e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:14,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:14,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [33:05<32:36:43, 6.70s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [33:05<32:36:43, 6.70s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:24,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:24,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [33:14<35:52:15, 7.37s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [33:14<35:52:15, 7.37s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3888, 'learning_rate': 3.2200000000000003e-05, 'epoch': 0.36} + 2%|█▍ | 325/17840 [33:14<35:52:15, 7.37s/it]g-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3752, 'learning_rate': 3.2300000000000006e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:36,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:13:15,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [33:27<33:38:57, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:44,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [33:27<33:38:57, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:44,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2381, 'learning_rate': 3.24e-05, 'epoch': 0.37} + 2%|█▍ | 327/17840 [33:27<33:38:57, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:44,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [33:33<32:50:59, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [33:33<32:50:59, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2241, 'learning_rate': 3.2500000000000004e-05, 'epoch': 0.37} + 2%|█▍ | 328/17840 [33:33<32:50:59, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 329/17840 [33:40<32:14:34, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 329/17840 [33:40<32:14:34, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:59,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:59,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:14:59,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 330/17840 [33:46<31:57:05, 6.57s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [33:52<31:28:14, 6.47s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [33:52<31:28:14, 6.47s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:11,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:11,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:11,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 332/17840 [33:59<30:55:34, 6.36s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 332/17840 [33:59<30:55:34, 6.36s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:19,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 333/17840 [34:05<30:29:40, 6.27s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 333/17840 [34:05<30:29:40, 6.27s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:23,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:23,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 334/17840 [34:11<29:56:01, 6.16s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 334/17840 [34:11<29:56:01, 6.16s/it]g-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:29,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:29,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:14:51,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 335/17840 [34:16<29:23:40, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 335/17840 [34:16<29:23:40, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.492, 'learning_rate': 3.32e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:38,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:38,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2488, 'learning_rate': 3.33e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:42,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:42,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 337/17840 [34:28<28:26:34, 5.85s/it]g-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:46,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:46,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:46,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 338/17840 [34:33<27:48:49, 5.72s/it]g-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:51,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:54,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:54,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2123, 'learning_rate': 3.3600000000000004e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:58,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:15:58,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 340/17840 [34:43<26:27:11, 5.44s/it]g-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:02,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:04,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:04,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:06,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:08,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:08,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3917, 'learning_rate': 3.3900000000000004e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:12,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:12,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:15:33,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 343/17840 [34:57<23:20:41, 4.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:14,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:16,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:14,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:16,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:14,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 344/17840 [35:01<22:11:28, 4.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:18,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 345/17840 [35:05<20:51:03, 4.29s/it]g-point operations will not be computed-17 17:16:18,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 345/17840 [35:05<20:51:03, 4.29s/it]g-point operations will not be computed-17 17:16:18,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 345/17840 [35:05<20:51:03, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:21,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 345/17840 [35:05<20:51:03, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:21,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 346/17840 [35:08<19:19:35, 3.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:24,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 347/17840 [35:11<17:50:37, 3.67s/it]g-point operations will not be computed-17 17:16:24,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 347/17840 [35:11<17:50:37, 3.67s/it]g-point operations will not be computed-17 17:16:24,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:29,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:27,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:29,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:27,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 348/17840 [35:14<16:23:45, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:30,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 348/17840 [35:14<16:23:45, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:30,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 349/17840 [35:16<14:56:02, 3.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:32,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:33,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:32,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:33,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:32,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 350/17840 [35:20<16:15:04, 3.35s/it]g-point operations will not be computed-17 17:16:32,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 350/17840 [35:20<16:15:04, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:38,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 350/17840 [35:20<16:15:04, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:38,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:42,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:38,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:42,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:38,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 351/17840 [35:28<23:15:23, 4.79s/it]g-point operations will not be computed-17 17:16:38,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 351/17840 [35:28<23:15:23, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 351/17840 [35:28<23:15:23, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 351/17840 [35:28<23:15:23, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 351/17840 [35:28<23:15:23, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 352/17840 [35:36<27:24:59, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 352/17840 [35:36<27:24:59, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 352/17840 [35:36<27:24:59, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:59,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:59,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2437, 'learning_rate': 3.5e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:59,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:16:59,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [35:51<32:00:14, 6.59s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [35:51<32:00:14, 6.59s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2521, 'learning_rate': 3.51e-05, 'epoch': 0.4} + 2%|█▌ | 354/17840 [35:51<32:00:14, 6.59s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [35:51<32:00:14, 6.59s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [35:51<32:00:14, 6.59s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [35:58<33:12:29, 6.84s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [35:58<33:12:29, 6.84s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [35:58<33:12:29, 6.84s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:21,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:21,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1411, 'learning_rate': 3.53e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:21,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:21,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:21,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [36:13<34:24:46, 7.09s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [36:13<34:24:46, 7.09s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [36:13<34:24:46, 7.09s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:36,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:36,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2485, 'learning_rate': 3.55e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:36,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:36,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [36:28<35:00:27, 7.21s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [36:28<35:00:27, 7.21s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2304, 'learning_rate': 3.56e-05, 'epoch': 0.4} + 2%|█▌ | 359/17840 [36:28<35:00:27, 7.21s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:50,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:50,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3708, 'learning_rate': 3.57e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:50,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:17:50,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [36:42<34:44:02, 7.15s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [36:42<34:44:02, 7.15s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2478, 'learning_rate': 3.58e-05, 'epoch': 0.4} + 2%|█▌ | 361/17840 [36:42<34:44:02, 7.15s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:04,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:04,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2039, 'learning_rate': 3.59e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:04,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:04,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 363/17840 [36:56<34:28:17, 7.10s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 363/17840 [36:56<34:28:17, 7.10s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1941, 'learning_rate': 3.6e-05, 'epoch': 0.41} + 2%|█▌ | 363/17840 [36:56<34:28:17, 7.10s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:18,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:18,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3788, 'learning_rate': 3.61e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:18,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:18,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [37:10<34:12:02, 7.05s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [37:10<34:12:02, 7.05s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:29,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:29,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [37:17<33:53:27, 6.98s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [37:17<33:53:27, 6.98s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2629, 'learning_rate': 3.63e-05, 'epoch': 0.41} + 2%|█▌ | 366/17840 [37:17<33:53:27, 6.98s/it]g-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:39,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:39,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2057, 'learning_rate': 3.6400000000000004e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:39,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:39,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:16:46,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [37:30<33:25:50, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [37:30<33:25:50, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3006, 'learning_rate': 3.65e-05, 'epoch': 0.41} + 2%|█▌ | 368/17840 [37:30<33:25:50, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [37:37<33:15:31, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [37:37<33:15:31, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3781, 'learning_rate': 3.66e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 17:18:58,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [37:44<33:04:14, 6.81s/it]g-point operations will not be computed-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [37:44<33:04:14, 6.81s/it]g-point operations will not be computed-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3337, 'learning_rate': 3.6700000000000004e-05, 'epoch': 0.41} + 2%|█▌ | 370/17840 [37:44<33:04:14, 6.81s/it]g-point operations will not be computed-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|��▌ | 370/17840 [37:44<33:04:14, 6.81s/it]g-point operations will not be computed-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [37:44<33:04:14, 6.81s/it]g-point operations will not be computed-17 17:18:47,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [37:50<32:58:24, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [37:50<32:58:24, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [37:50<32:58:24, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [37:50<32:58:24, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 372/17840 [37:57<32:48:18, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:16,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:16,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:16,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 373/17840 [38:04<32:37:13, 6.72s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 373/17840 [38:04<32:37:13, 6.72s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 373/17840 [38:04<32:37:13, 6.72s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:26,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:26,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4384, 'learning_rate': 3.71e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:26,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:26,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:26,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [38:19<35:29:19, 7.32s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [38:19<35:29:19, 7.32s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:40,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:40,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [38:26<34:20:21, 7.08s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [38:26<34:20:21, 7.08s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:46,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:46,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 377/17840 [38:32<33:18:12, 6.87s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 377/17840 [38:32<33:18:12, 6.87s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:52,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:19:52,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 378/17840 [38:38<32:32:10, 6.71s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 378/17840 [38:38<32:32:10, 6.71s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 378/17840 [38:38<32:32:10, 6.71s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 378/17840 [38:38<32:32:10, 6.71s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:00,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:00,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:05,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:05,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 380/17840 [38:51<31:23:30, 6.47s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 380/17840 [38:51<31:23:30, 6.47s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:11,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:11,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [38:57<30:56:23, 6.38s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [38:57<30:56:23, 6.38s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [38:57<30:56:23, 6.38s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [38:57<30:56:23, 6.38s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:19,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:19,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:19,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:19,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:25,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:25,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:29,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:29,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 384/17840 [39:15<29:37:35, 6.11s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 384/17840 [39:15<29:37:35, 6.11s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:35,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:35,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 385/17840 [39:21<29:05:55, 6.00s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:39,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:39,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:39,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 386/17840 [39:26<28:37:20, 5.90s/it]g-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:45,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:45,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:45,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:19:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 387/17840 [39:32<28:01:50, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:20:49,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:49,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:49,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 388/17840 [39:37<27:24:36, 5.65s/it]g-point operations will not be computed-17 17:20:49,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:55,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:49,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:55,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:49,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:20:55,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:49,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 389/17840 [39:43<26:50:26, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 389/17840 [39:43<26:50:26, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 389/17840 [39:43<26:50:26, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:03,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:06,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:08,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:08,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5114, 'learning_rate': 3.88e-05, 'epoch': 0.44} +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:11,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:11,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:20:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 392/17840 [39:57<24:24:39, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 392/17840 [39:57<24:24:39, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 392/17840 [39:57<24:24:39, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:17,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:19,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:19,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:21,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:23,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:23,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:25,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:28,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:30,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:30,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:31,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:34,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:34,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:36,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:36,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:37,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:40,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:40,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6483, 'learning_rate': 3.97e-05, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:44,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:44,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:44,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:48,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:48,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:52,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:52,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:21:52,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [40:40<26:57:10, 5.56s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [40:40<26:57:10, 5.56s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [40:40<26:57:10, 5.56s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [40:40<26:57:10, 5.56s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [40:40<26:57:10, 5.56s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [40:47<29:41:57, 6.13s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:07,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:07,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [40:55<31:31:09, 6.51s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [40:55<31:31:09, 6.51s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2613, 'learning_rate': 4.0100000000000006e-05, 'epoch': 0.45} + 2%|█▋ | 404/17840 [40:55<31:31:09, 6.51s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [40:55<31:31:09, 6.51s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [40:55<31:31:09, 6.51s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [41:02<32:42:47, 6.75s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [41:02<32:42:47, 6.75s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:23,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [41:09<33:21:41, 6.89s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [41:09<33:21:41, 6.89s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3065, 'learning_rate': 4.0300000000000004e-05, 'epoch': 0.46} + 2%|█▋ | 406/17840 [41:09<33:21:41, 6.89s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [41:09<33:21:41, 6.89s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [41:09<33:21:41, 6.89s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [41:16<33:50:18, 6.99s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [41:16<33:50:18, 6.99s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [41:16<33:50:18, 6.99s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [41:16<33:50:18, 6.99s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [41:16<33:50:18, 6.99s/it]g-point operations will not be computed-17 17:21:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [41:24<34:14:15, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [41:24<34:14:15, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [41:24<34:14:15, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [41:31<34:14:45, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [41:31<34:14:45, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4455, 'learning_rate': 4.0600000000000004e-05, 'epoch': 0.46} + 2%|█▋ | 409/17840 [41:31<34:14:45, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:53,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:53,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3346, 'learning_rate': 4.07e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:53,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:53,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:22:53,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [41:45<34:15:55, 7.08s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [41:45<34:15:55, 7.08s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [41:45<34:15:55, 7.08s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:07,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:07,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.271, 'learning_rate': 4.09e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:07,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:07,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:07,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [41:59<33:53:00, 7.00s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:18,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:18,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [42:06<33:50:04, 6.99s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [42:06<33:50:04, 6.99s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1533, 'learning_rate': 4.11e-05, 'epoch': 0.46} + 2%|█▊ | 414/17840 [42:06<33:50:04, 6.99s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:28,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:28,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1654, 'learning_rate': 4.12e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:28,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:28,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 416/17840 [42:20<33:28:22, 6.92s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 416/17840 [42:20<33:28:22, 6.92s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:38,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:38,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [42:26<33:14:56, 6.87s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [42:26<33:14:56, 6.87s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2844, 'learning_rate': 4.14e-05, 'epoch': 0.47} + 2%|█▊ | 417/17840 [42:26<33:14:56, 6.87s/it]g-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3859, 'learning_rate': 4.15e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:23:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:22:41,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [42:40<32:59:07, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [42:40<32:59:07, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [42:40<32:59:07, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 420/17840 [42:46<32:41:36, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 420/17840 [42:46<32:41:36, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.281, 'learning_rate': 4.17e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:07,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 421/17840 [42:53<32:26:28, 6.70s/it]g-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 421/17840 [42:53<32:26:28, 6.70s/it]g-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.296, 'learning_rate': 4.18e-05, 'epoch': 0.47} + 2%|█▊ | 421/17840 [42:53<32:26:28, 6.70s/it]g-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:15,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:15,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3627, 'learning_rate': 4.19e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:15,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:15,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:15,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:23:57,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 423/17840 [43:06<32:09:32, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 423/17840 [43:06<32:09:32, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 423/17840 [43:06<32:09:32, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 424/17840 [43:13<32:09:00, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 424/17840 [43:13<32:09:00, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:32,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:32,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 425/17840 [43:22<35:27:08, 7.33s/it]g-point operations will not be computed-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 425/17840 [43:22<35:27:08, 7.33s/it]g-point operations will not be computed-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4026, 'learning_rate': 4.22e-05, 'epoch': 0.48} + 2%|█▊ | 425/17840 [43:22<35:27:08, 7.33s/it]g-point operations will not be computed-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 425/17840 [43:22<35:27:08, 7.33s/it]g-point operations will not be computed-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 425/17840 [43:22<35:27:08, 7.33s/it]g-point operations will not be computed-17 17:24:23,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 426/17840 [43:28<34:11:39, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 426/17840 [43:28<34:11:39, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 426/17840 [43:28<34:11:39, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [43:35<33:13:21, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [43:35<33:13:21, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:53,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:24:53,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 428/17840 [43:41<32:28:45, 6.72s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 428/17840 [43:41<32:28:45, 6.72s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:00,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:00,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 429/17840 [43:47<31:59:31, 6.61s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 429/17840 [43:47<31:59:31, 6.61s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:06,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:06,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 430/17840 [43:54<31:28:23, 6.51s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 430/17840 [43:54<31:28:23, 6.51s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:12,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:12,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [44:00<31:02:32, 6.42s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [44:00<31:02:32, 6.42s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:18,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:18,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [44:06<30:42:18, 6.35s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [44:06<30:42:18, 6.35s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:25,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:25,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [44:12<30:26:17, 6.30s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [44:12<30:26:17, 6.30s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0756, 'learning_rate': 4.3e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:32,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [44:18<30:04:30, 6.22s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [44:18<30:04:30, 6.22s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:37,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:37,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 435/17840 [44:24<29:30:04, 6.10s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 435/17840 [44:24<29:30:04, 6.10s/it]g-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:42,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:42,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:24:45,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 436/17840 [44:30<28:56:56, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 436/17840 [44:30<28:56:56, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4725, 'learning_rate': 4.33e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:51,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:51,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4726, 'learning_rate': 4.3400000000000005e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:25:55,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 438/17840 [44:41<27:57:13, 5.78s/it]g-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 438/17840 [44:41<27:57:13, 5.78s/it]g-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3749, 'learning_rate': 4.35e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:01,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 439/17840 [44:47<27:44:51, 5.74s/it]g-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 439/17840 [44:47<27:44:51, 5.74s/it]g-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:05,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:07,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:07,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.311, 'learning_rate': 4.3700000000000005e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:11,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:25:47,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [44:57<25:53:29, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [44:57<25:53:29, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:16,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 442/17840 [45:01<24:52:57, 5.15s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 442/17840 [45:01<24:52:57, 5.15s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:19,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:19,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:23,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:23,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:25,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:27,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:27,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:29,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:31,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:31,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:34,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:34,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:35,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:35,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:38,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:40,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:40,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:41,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:44,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:44,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9419, 'learning_rate': 4.47e-05, 'epoch': 0.5} +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:48,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:48,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:48,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:52,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:52,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:56,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:56,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:26:56,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [45:44<26:56:39, 5.58s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [45:44<26:56:39, 5.58s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [45:44<26:56:39, 5.58s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [45:44<26:56:39, 5.58s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 452/17840 [45:44<26:56:39, 5.58s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 453/17840 [45:52<29:45:34, 6.16s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:11,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:11,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:11,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [45:59<31:26:06, 6.51s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [45:59<31:26:06, 6.51s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [45:59<31:26:06, 6.51s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [45:59<31:26:06, 6.51s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [45:59<31:26:06, 6.51s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [46:06<32:39:10, 6.76s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [46:06<32:39:10, 6.76s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [46:06<32:39:10, 6.76s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:29,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:29,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3515, 'learning_rate': 4.53e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:29,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:29,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:29,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [46:21<34:06:10, 7.06s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [46:21<34:06:10, 7.06s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [46:21<34:06:10, 7.06s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [46:21<34:06:10, 7.06s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [46:21<34:06:10, 7.06s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 458/17840 [46:28<34:25:33, 7.13s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:48,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:48,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:27:48,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [46:36<34:36:34, 7.17s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [46:36<34:36:34, 7.17s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [46:36<34:36:34, 7.17s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [46:36<34:36:34, 7.17s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [46:36<34:36:34, 7.17s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 460/17840 [46:43<34:31:33, 7.15s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:02,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:02,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [46:50<34:21:25, 7.12s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [46:50<34:21:25, 7.12s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1781, 'learning_rate': 4.58e-05, 'epoch': 0.52} + 3%|█▉ | 461/17840 [46:50<34:21:25, 7.12s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [46:50<34:21:25, 7.12s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [46:50<34:21:25, 7.12s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 462/17840 [46:57<34:25:39, 7.13s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:16,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:16,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [47:04<34:13:06, 7.09s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [47:04<34:13:06, 7.09s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2587, 'learning_rate': 4.600000000000001e-05, 'epoch': 0.52} + 3%|█▉ | 463/17840 [47:04<34:13:06, 7.09s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:26,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:26,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1396, 'learning_rate': 4.61e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:26,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:26,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:26,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 465/17840 [47:18<33:49:37, 7.01s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 465/17840 [47:18<33:49:37, 7.01s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:38,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [47:25<33:39:55, 6.98s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [47:25<33:39:55, 6.98s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3356, 'learning_rate': 4.630000000000001e-05, 'epoch': 0.52} + 3%|█▉ | 466/17840 [47:25<33:39:55, 6.98s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [47:25<33:39:55, 6.98s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [47:25<33:39:55, 6.98s/it]g-point operations will not be computed-17 17:26:13,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [47:32<33:24:40, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [47:32<33:24:40, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [47:32<33:24:40, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [47:32<33:24:40, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [47:38<33:08:02, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:57,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:28:57,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [47:45<32:58:11, 6.83s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [47:45<32:58:11, 6.83s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2979, 'learning_rate': 4.660000000000001e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:05,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [47:52<32:41:33, 6.78s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [47:52<32:41:33, 6.78s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3177, 'learning_rate': 4.6700000000000003e-05, 'epoch': 0.53} + 3%|██ | 470/17840 [47:52<32:41:33, 6.78s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:14,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:14,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1592, 'learning_rate': 4.6800000000000006e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:17,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:17,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [48:05<32:27:59, 6.73s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [48:05<32:27:59, 6.73s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1543, 'learning_rate': 4.69e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:25,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [48:12<32:13:12, 6.68s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [48:12<32:13:12, 6.68s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4002, 'learning_rate': 4.7e-05, 'epoch': 0.53} + 3%|██ | 473/17840 [48:12<32:13:12, 6.68s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:34,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:34,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3175, 'learning_rate': 4.71e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:34,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:34,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [48:27<35:08:06, 7.28s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [48:27<35:08:06, 7.28s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2417, 'learning_rate': 4.72e-05, 'epoch': 0.53} + 3%|██ | 475/17840 [48:27<35:08:06, 7.28s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [48:27<35:08:06, 7.28s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 476/17840 [48:33<33:59:51, 7.05s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 476/17840 [48:33<33:59:51, 7.05s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [48:40<32:53:02, 6.82s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [48:40<32:53:02, 6.82s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:58,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:29:58,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [48:46<32:08:55, 6.67s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [48:46<32:08:55, 6.67s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:05,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:05,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 479/17840 [48:52<31:32:30, 6.54s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 479/17840 [48:52<31:32:30, 6.54s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1042, 'learning_rate': 4.76e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:12,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [48:58<31:06:30, 6.45s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [48:58<31:06:30, 6.45s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3297, 'learning_rate': 4.77e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:19,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [49:05<30:57:57, 6.42s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [49:05<30:57:57, 6.42s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2246, 'learning_rate': 4.78e-05, 'epoch': 0.54} + 3%|██ | 481/17840 [49:05<30:57:57, 6.42s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:27,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:27,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2478, 'learning_rate': 4.79e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:27,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:27,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 483/17840 [49:19<32:23:06, 6.72s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 483/17840 [49:19<32:23:06, 6.72s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3329, 'learning_rate': 4.8e-05, 'epoch': 0.54} + 3%|██ | 483/17840 [49:19<32:23:06, 6.72s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:41,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:41,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2585, 'learning_rate': 4.8100000000000004e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:45,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 485/17840 [49:31<30:37:05, 6.35s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 485/17840 [49:31<30:37:05, 6.35s/it]g-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:49,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:49,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:28:49,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 486/17840 [49:37<29:35:57, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 486/17840 [49:37<29:35:57, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.211, 'learning_rate': 4.83e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:58,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:30:58,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1027, 'learning_rate': 4.8400000000000004e-05, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:02,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 488/17840 [49:47<27:48:49, 5.77s/it]g-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 488/17840 [49:47<27:48:49, 5.77s/it]g-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:06,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:08,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:08,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:08,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:12,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 490/17840 [49:58<25:57:06, 5.38s/it]g-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 490/17840 [49:58<25:57:06, 5.38s/it]g-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:15,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:18,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:18,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1914, 'learning_rate': 4.88e-05, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:21,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:21,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:30:54,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 492/17840 [50:07<23:52:55, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:23,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:25,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:23,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:25,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:23,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 493/17840 [50:11<22:35:25, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:27,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 494/17840 [50:14<21:12:08, 4.40s/it]g-point operations will not be computed-17 17:31:27,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 494/17840 [50:14<21:12:08, 4.40s/it]g-point operations will not be computed-17 17:31:27,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 494/17840 [50:14<21:12:08, 4.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:31,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 495/17840 [50:18<19:44:13, 4.10s/it]g-point operations will not be computed-17 17:31:31,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 495/17840 [50:18<19:44:13, 4.10s/it]g-point operations will not be computed-17 17:31:31,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:36,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:34,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:36,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:34,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 496/17840 [50:21<18:14:03, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:37,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 497/17840 [50:24<16:49:54, 3.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:40,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 497/17840 [50:24<16:49:54, 3.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:40,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 498/17840 [50:26<15:26:57, 3.21s/it]g-point operations will not be computed-17 17:31:40,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 498/17840 [50:26<15:26:57, 3.21s/it]g-point operations will not be computed-17 17:31:40,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7833, 'learning_rate': 4.9500000000000004e-05, 'epoch': 0.56} + 3%|██▏ | 499/17840 [50:29<14:12:46, 2.95s/it]g-point operations will not be computed-17 17:31:42,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:46,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:45,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [50:33<15:42:46, 3.26s/it]g-point operations will not be computed-17 17:31:45,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [50:33<15:42:46, 3.26s/it]g-point operations will not be computed-17 17:31:45,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [50:33<15:42:46, 3.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:50,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [50:33<15:42:46, 3.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:50,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:54,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:50,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:31:54,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:50,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [50:40<22:24:52, 4.65s/it]g-point operations will not be computed-17 17:31:50,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [50:40<22:24:52, 4.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [50:40<22:24:52, 4.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:02,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:02,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [50:48<26:43:32, 5.55s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [50:48<26:43:32, 5.55s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [50:48<26:43:32, 5.55s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [50:48<26:43:32, 5.55s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 503/17840 [50:56<29:25:47, 6.11s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 503/17840 [50:56<29:25:47, 6.11s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:15,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:15,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:15,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:03<31:10:41, 6.47s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:03<31:10:41, 6.47s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:03<31:10:41, 6.47s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:03<31:10:41, 6.47s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [51:03<31:10:41, 6.47s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [51:10<32:26:17, 6.74s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [51:10<32:26:17, 6.74s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:31,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:31,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:17<33:06:42, 6.88s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:17<33:06:42, 6.88s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:17<33:06:42, 6.88s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:17<33:06:42, 6.88s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [51:17<33:06:42, 6.88s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 507/17840 [51:25<33:36:54, 6.98s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 507/17840 [51:25<33:36:54, 6.98s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 507/17840 [51:25<33:36:54, 6.98s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:47,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:47,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3685, 'learning_rate': 5.05e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:47,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:47,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:32:47,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [51:39<34:05:28, 7.08s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [51:39<34:05:28, 7.08s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [51:39<34:05:28, 7.08s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:02,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:02,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4934, 'learning_rate': 5.0700000000000006e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:02,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:02,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:02,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [51:53<34:03:33, 7.08s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [51:53<34:03:33, 7.08s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:14,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [52:00<34:07:14, 7.09s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [52:00<34:07:14, 7.09s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2927, 'learning_rate': 5.0900000000000004e-05, 'epoch': 0.57} + 3%|██▏ | 512/17840 [52:00<34:07:14, 7.09s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [52:00<34:07:14, 7.09s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [52:00<34:07:14, 7.09s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [52:07<33:56:16, 7.05s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:26,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:26,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:26,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [52:14<33:51:29, 7.04s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [52:14<33:51:29, 7.04s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:35,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [52:21<33:37:47, 6.99s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [52:21<33:37:47, 6.99s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3176, 'learning_rate': 5.1200000000000004e-05, 'epoch': 0.58} + 3%|██▏ | 515/17840 [52:21<33:37:47, 6.99s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [52:21<33:37:47, 6.99s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [52:21<33:37:47, 6.99s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [52:28<33:29:03, 6.96s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [52:28<33:29:03, 6.96s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:49,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 517/17840 [52:35<33:16:25, 6.91s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 517/17840 [52:35<33:16:25, 6.91s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3672, 'learning_rate': 5.14e-05, 'epoch': 0.58} + 3%|██▏ | 517/17840 [52:35<33:16:25, 6.91s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:57,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:57,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2829, 'learning_rate': 5.1500000000000005e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:57,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:57,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:33:57,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [52:48<32:56:14, 6.85s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:07,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:07,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [52:55<32:47:56, 6.82s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [52:55<32:47:56, 6.82s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2634, 'learning_rate': 5.17e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:16,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [53:02<32:40:25, 6.79s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [53:02<32:40:25, 6.79s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2429, 'learning_rate': 5.1800000000000005e-05, 'epoch': 0.58} + 3%|██▏ | 521/17840 [53:02<32:40:25, 6.79s/it]g-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:24,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:24,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1855, 'learning_rate': 5.19e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:24,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:24,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:24,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:31:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [53:15<32:11:36, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [53:15<32:11:36, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [53:15<32:11:36, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [53:22<32:02:01, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [53:22<32:02:01, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3319, 'learning_rate': 5.2100000000000006e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:42,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [53:31<35:16:18, 7.33s/it]g-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [53:31<35:16:18, 7.33s/it]g-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4304, 'learning_rate': 5.22e-05, 'epoch': 0.59} + 3%|██▏ | 525/17840 [53:31<35:16:18, 7.33s/it]g-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:53,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:53,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1157, 'learning_rate': 5.2300000000000004e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:53,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:53,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:34:53,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:34:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [53:43<33:02:18, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:01,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [53:43<33:02:18, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:01,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [53:43<33:02:18, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:01,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [53:43<33:02:18, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:01,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 528/17840 [53:50<32:11:51, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 528/17840 [53:50<32:11:51, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 528/17840 [53:50<32:11:51, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 529/17840 [53:56<31:45:30, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 529/17840 [53:56<31:45:30, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:15,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:15,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 530/17840 [54:02<31:26:20, 6.54s/it]g-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 530/17840 [54:02<31:26:20, 6.54s/it]g-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5276, 'learning_rate': 5.270000000000001e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:23,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 531/17840 [54:09<30:50:20, 6.41s/it]g-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 531/17840 [54:09<30:50:20, 6.41s/it]g-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:27,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:27,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 532/17840 [54:15<30:22:29, 6.32s/it]g-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 532/17840 [54:15<30:22:29, 6.32s/it]g-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:33,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:33,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 533/17840 [54:21<29:53:33, 6.22s/it]g-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 533/17840 [54:21<29:53:33, 6.22s/it]g-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:39,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:39,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:07,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 534/17840 [54:27<29:18:48, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 534/17840 [54:27<29:18:48, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1762, 'learning_rate': 5.31e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:48,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:48,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3117, 'learning_rate': 5.3200000000000006e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:52,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 536/17840 [54:38<28:23:58, 5.91s/it]g-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 536/17840 [54:38<28:23:58, 5.91s/it]g-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3505, 'learning_rate': 5.330000000000001e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:35:58,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 537/17840 [54:44<28:01:45, 5.83s/it]g-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 537/17840 [54:44<28:01:45, 5.83s/it]g-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:02,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:02,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:35:43,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 538/17840 [54:49<27:21:26, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 538/17840 [54:49<27:21:26, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.535, 'learning_rate': 5.3500000000000006e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:10,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:10,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2488, 'learning_rate': 5.360000000000001e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:13,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 540/17840 [54:59<25:41:40, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:16,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 540/17840 [54:59<25:41:40, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:16,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:18,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:16,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 541/17840 [55:04<24:28:59, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:20,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 541/17840 [55:04<24:28:59, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:20,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:22,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:20,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 542/17840 [55:08<23:15:19, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:24,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 542/17840 [55:08<23:15:19, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:24,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:26,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:24,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 543/17840 [55:12<21:53:05, 4.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:28,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 543/17840 [55:12<21:53:05, 4.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:28,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:30,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:28,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 544/17840 [55:15<20:23:43, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:32,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 544/17840 [55:15<20:23:43, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:32,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 545/17840 [55:18<18:50:14, 3.92s/it]g-point operations will not be computed-17 17:36:32,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 545/17840 [55:18<18:50:14, 3.92s/it]g-point operations will not be computed-17 17:36:32,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:36,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:35,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 546/17840 [55:21<17:28:55, 3.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:38,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 546/17840 [55:21<17:28:55, 3.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:38,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 547/17840 [55:24<16:17:06, 3.39s/it]g-point operations will not be computed-17 17:36:38,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 547/17840 [55:24<16:17:06, 3.39s/it]g-point operations will not be computed-17 17:36:38,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 548/17840 [55:27<15:06:32, 3.15s/it]g-point operations will not be computed-17 17:36:40,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:44,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:43,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:44,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:43,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:46,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:45,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:46,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:45,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2853, 'learning_rate': 5.4600000000000006e-05, 'epoch': 0.62} + 3%|██▎ | 550/17840 [55:33<15:18:33, 3.19s/it]g-point operations will not be computed-17 17:36:45,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 550/17840 [55:33<15:18:33, 3.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:51,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:36:54,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:51,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [55:41<22:01:37, 4.59s/it]g-point operations will not be computed-17 17:36:51,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [55:41<22:01:37, 4.59s/it]g-point operations will not be computed-17 17:36:51,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [55:41<22:01:37, 4.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 551/17840 [55:41<22:01:37, 4.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:36:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:02,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:36:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [55:48<26:22:29, 5.49s/it]g-point operations will not be computed-17 17:36:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [55:48<26:22:29, 5.49s/it]g-point operations will not be computed-17 17:36:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [55:48<26:22:29, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [55:48<26:22:29, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 552/17840 [55:48<26:22:29, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 553/17840 [55:56<29:16:35, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 553/17840 [55:56<29:16:35, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3751, 'learning_rate': 5.500000000000001e-05, 'epoch': 0.62} + 3%|██▎ | 553/17840 [55:56<29:16:35, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:19,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:19,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2776, 'learning_rate': 5.5100000000000004e-05, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:19,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:19,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:37:19,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [56:11<32:17:39, 6.73s/it]g-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [56:11<32:17:39, 6.73s/it]g-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [56:11<32:17:39, 6.73s/it]g-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [56:11<32:17:39, 6.73s/it]g-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [56:11<32:17:39, 6.73s/it]g-point operations will not be computed-17 17:37:06,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [56:18<33:12:43, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [56:18<33:12:43, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [56:18<33:12:43, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [56:18<33:12:43, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [56:25<33:38:25, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [56:25<33:38:25, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [56:25<33:38:25, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [56:25<33:38:25, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [56:25<33:38:25, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:35,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [56:32<33:54:24, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [56:32<33:54:24, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [56:32<33:54:24, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [56:32<33:54:24, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [56:40<34:06:52, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [56:40<34:06:52, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [56:40<34:06:52, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [56:40<34:06:52, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [56:40<34:06:52, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 560/17840 [56:47<34:05:40, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:06,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:06,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:06,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 561/17840 [56:54<33:58:45, 7.08s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 561/17840 [56:54<33:58:45, 7.08s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 561/17840 [56:54<33:58:45, 7.08s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:16,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:16,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2875, 'learning_rate': 5.590000000000001e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:16,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:16,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:16,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [57:08<33:39:26, 7.01s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:27,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:27,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [57:14<33:25:15, 6.96s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [57:14<33:25:15, 6.96s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2504, 'learning_rate': 5.610000000000001e-05, 'epoch': 0.63} + 3%|██▍ | 564/17840 [57:14<33:25:15, 6.96s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:37,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:37,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3606, 'learning_rate': 5.620000000000001e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:37,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:37,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:37,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [57:28<33:10:02, 6.91s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [57:28<33:10:02, 6.91s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:49,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [57:35<33:06:56, 6.90s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [57:35<33:06:56, 6.90s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2408, 'learning_rate': 5.6399999999999995e-05, 'epoch': 0.64} + 3%|██▍ | 567/17840 [57:35<33:06:56, 6.90s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:57,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:57,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2025, 'learning_rate': 5.65e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:57,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:57,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:38:57,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 569/17840 [57:49<32:41:45, 6.82s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:07,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:07,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 570/17840 [57:55<32:43:54, 6.82s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 570/17840 [57:55<32:43:54, 6.82s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.284, 'learning_rate': 5.6699999999999996e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:16,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 571/17840 [58:02<32:30:12, 6.78s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 571/17840 [58:02<32:30:12, 6.78s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2553, 'learning_rate': 5.68e-05, 'epoch': 0.64} + 3%|██▍ | 571/17840 [58:02<32:30:12, 6.78s/it]g-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:24,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:24,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3387, 'learning_rate': 5.69e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:24,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:24,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:37:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 573/17840 [58:15<31:59:03, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 573/17840 [58:15<31:59:03, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:36,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 574/17840 [58:22<31:45:02, 6.62s/it]g-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 574/17840 [58:22<31:45:02, 6.62s/it]g-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1368, 'learning_rate': 5.71e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 17:39:42,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [58:31<35:07:02, 7.32s/it]g-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [58:31<35:07:02, 7.32s/it]g-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5257, 'learning_rate': 5.72e-05, 'epoch': 0.64} + 3%|██▍ | 575/17840 [58:31<35:07:02, 7.32s/it]g-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [58:31<35:07:02, 7.32s/it]g-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [58:31<35:07:02, 7.32s/it]g-point operations will not be computed-17 17:39:32,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [58:37<33:55:29, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [58:37<33:55:29, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [58:37<33:55:29, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [58:44<33:05:11, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [58:44<33:05:11, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:02,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:02,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 578/17840 [58:50<32:19:50, 6.74s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 578/17840 [58:50<32:19:50, 6.74s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4337, 'learning_rate': 5.7499999999999995e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:10,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [58:56<31:44:08, 6.62s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [58:56<31:44:08, 6.62s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9452, 'learning_rate': 5.76e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:17,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [59:03<31:14:42, 6.52s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [59:03<31:14:42, 6.52s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5149, 'learning_rate': 5.77e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:23,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [59:09<30:53:19, 6.44s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [59:09<30:53:19, 6.44s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.402, 'learning_rate': 5.7799999999999995e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:29,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 582/17840 [59:15<30:27:33, 6.35s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 582/17840 [59:15<30:27:33, 6.35s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1687, 'learning_rate': 5.79e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:35,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 583/17840 [59:21<30:01:49, 6.26s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 583/17840 [59:21<30:01:49, 6.26s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3502, 'learning_rate': 5.8e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:41,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 584/17840 [59:27<29:26:12, 6.14s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 584/17840 [59:27<29:26:12, 6.14s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:45,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:45,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:45,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 585/17840 [59:33<28:52:13, 6.02s/it]g-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:51,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:51,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:51,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:39:54,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 586/17840 [59:38<28:27:16, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 586/17840 [59:38<28:27:16, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 586/17840 [59:38<28:27:16, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:59,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:40:59,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:04,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:04,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 588/17840 [59:49<27:22:19, 5.71s/it]g-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:08,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:10,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:10,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2097, 'learning_rate': 5.86e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:10,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:10,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:15,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:18,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:18,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:18,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:40:55,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 591/17840 [1:00:05<25:26:00, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:24,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:24,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 592/17840 [1:00:10<24:32:42, 5.12s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:27,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:27,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:29,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:32,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:32,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:34,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:36,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:36,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:37,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:39,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:39,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:42,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:42,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:44,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:46,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:46,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:49,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:49,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:50,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:53,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2977, 'learning_rate': 5.97e-05, 'epoch': 0.67} +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:57,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:41:57,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:00,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:00,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4026, 'learning_rate': 5.9800000000000003e-05, 'epoch': 0.67} +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:04,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:04,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:04,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 602/17840 [1:00:53<26:41:06, 5.57s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 602/17840 [1:00:53<26:41:06, 5.57s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 602/17840 [1:00:53<26:41:06, 5.57s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 602/17840 [1:00:53<26:41:06, 5.57s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 602/17840 [1:00:53<26:41:06, 5.57s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 603/17840 [1:01:00<29:26:36, 6.15s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:19,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:19,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [1:01:07<31:13:03, 6.52s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [1:01:07<31:13:03, 6.52s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3304, 'learning_rate': 6.0100000000000004e-05, 'epoch': 0.68} + 3%|██▌ | 604/17840 [1:01:07<31:13:03, 6.52s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [1:01:07<31:13:03, 6.52s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [1:01:07<31:13:03, 6.52s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [1:01:15<32:22:38, 6.76s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [1:01:15<32:22:38, 6.76s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [1:01:15<32:22:38, 6.76s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:37,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:37,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.277, 'learning_rate': 6.03e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:37,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:37,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:37,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 607/17840 [1:01:29<33:30:06, 7.00s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 607/17840 [1:01:29<33:30:06, 7.00s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 607/17840 [1:01:29<33:30:06, 7.00s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:52,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:52,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3776, 'learning_rate': 6.05e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:52,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:42:52,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [1:01:43<33:49:13, 7.07s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [1:01:43<33:49:13, 7.07s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2486, 'learning_rate': 6.06e-05, 'epoch': 0.68} + 3%|██▌ | 609/17840 [1:01:43<33:49:13, 7.07s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:06,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:06,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3759, 'learning_rate': 6.07e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:06,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:06,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:06,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [1:01:58<33:45:08, 7.05s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [1:01:58<33:45:08, 7.05s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:18,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:02:05<33:37:07, 7.03s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:02:05<33:37:07, 7.03s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4961, 'learning_rate': 6.09e-05, 'epoch': 0.69} + 3%|██▌ | 612/17840 [1:02:05<33:37:07, 7.03s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:02:05<33:37:07, 7.03s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [1:02:05<33:37:07, 7.03s/it]g-point operations will not be computed-17 17:41:22,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:02:11<33:28:54, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:02:11<33:28:54, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [1:02:11<33:28:54, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [1:02:18<33:11:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [1:02:18<33:11:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5273, 'learning_rate': 6.110000000000001e-05, 'epoch': 0.69} + 3%|██▌ | 614/17840 [1:02:18<33:11:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:41,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:41,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2826, 'learning_rate': 6.12e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:41,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:41,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:41,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 616/17840 [1:02:32<32:58:37, 6.89s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:51,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:51,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 617/17840 [1:02:39<32:49:24, 6.86s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 617/17840 [1:02:39<32:49:24, 6.86s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2531, 'learning_rate': 6.14e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-17 17:43:59,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 618/17840 [1:02:45<32:36:01, 6.81s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 618/17840 [1:02:45<32:36:01, 6.81s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1884, 'learning_rate': 6.15e-05, 'epoch': 0.69} + 3%|██▌ | 618/17840 [1:02:45<32:36:01, 6.81s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:08,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:08,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2256, 'learning_rate': 6.16e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:08,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:08,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 620/17840 [1:02:59<32:21:04, 6.76s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 620/17840 [1:02:59<32:21:04, 6.76s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:18,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:18,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 621/17840 [1:03:05<32:07:39, 6.72s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 621/17840 [1:03:05<32:07:39, 6.72s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3505, 'learning_rate': 6.18e-05, 'epoch': 0.7} + 3%|██▌ | 621/17840 [1:03:05<32:07:39, 6.72s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:28,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:28,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1937, 'learning_rate': 6.19e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:28,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:34,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:34,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:34,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4754, 'learning_rate': 6.2e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:34,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 624/17840 [1:03:25<31:45:00, 6.64s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 624/17840 [1:03:25<31:45:00, 6.64s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:44,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:44,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 625/17840 [1:03:34<34:54:35, 7.30s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 625/17840 [1:03:34<34:54:35, 7.30s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6064, 'learning_rate': 6.220000000000001e-05, 'epoch': 0.7} + 4%|██▌ | 625/17840 [1:03:34<34:54:35, 7.30s/it]g-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:56,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:56,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4407, 'learning_rate': 6.23e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:56,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:56,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:44:56,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:43:29,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:03:47<32:56:07, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:04,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:03:47<32:56:07, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:04,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:03:47<32:56:07, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:04,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 628/17840 [1:03:54<32:14:50, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 628/17840 [1:03:54<32:14:50, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2603, 'learning_rate': 6.25e-05, 'epoch': 0.7} + 4%|██▌ | 628/17840 [1:03:54<32:14:50, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 628/17840 [1:03:54<32:14:50, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 629/17840 [1:04:00<31:48:32, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:19,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:19,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:19,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:04:06<31:23:49, 6.57s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:25,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:25,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:25,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:04:13<31:04:35, 6.50s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:04:13<31:04:35, 6.50s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:33,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:33,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 632/17840 [1:04:19<30:36:38, 6.40s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 632/17840 [1:04:19<30:36:38, 6.40s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:39,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:39,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:04:25<30:13:08, 6.32s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:04:25<30:13:08, 6.32s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:45,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:45,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 634/17840 [1:04:31<29:49:42, 6.24s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 634/17840 [1:04:31<29:49:42, 6.24s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:51,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:51,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 635/17840 [1:04:37<29:21:11, 6.14s/it]g-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:55,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:55,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:45:55,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:45:11,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 636/17840 [1:04:43<28:52:50, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 636/17840 [1:04:43<28:52:50, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:04,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:04,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4019, 'learning_rate': 6.340000000000001e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:04,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:10,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:10,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.196, 'learning_rate': 6.35e-05, 'epoch': 0.72} +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:14,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:14,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 639/17840 [1:05:00<27:20:55, 5.72s/it]g-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:18,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:20,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:20,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.32, 'learning_rate': 6.37e-05, 'epoch': 0.72} +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:24,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:24,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:00,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 641/17840 [1:05:10<25:48:14, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 641/17840 [1:05:10<25:48:14, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:30,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:30,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:32,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:34,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:34,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:36,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:38,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:38,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:40,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:42,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:42,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:44,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:44,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:45,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:48,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:48,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:50,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:50,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:53,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:53,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:55,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:55,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:55,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:58,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:46:58,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:02,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:02,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:02,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:06,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:06,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:06,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:06,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:06,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 652/17840 [1:05:58<27:09:10, 5.69s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:17,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:17,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:06:05<29:39:55, 6.21s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:06:05<29:39:55, 6.21s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.435, 'learning_rate': 6.500000000000001e-05, 'epoch': 0.73} + 4%|██▋ | 653/17840 [1:06:05<29:39:55, 6.21s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:06:05<29:39:55, 6.21s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:06:05<29:39:55, 6.21s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:06:13<31:22:04, 6.57s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:06:13<31:22:04, 6.57s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:06:13<31:22:04, 6.57s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:36,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:36,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3698, 'learning_rate': 6.52e-05, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:36,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:36,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:06:28<33:11:59, 6.96s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:06:28<33:11:59, 6.96s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2575, 'learning_rate': 6.53e-05, 'epoch': 0.74} + 4%|██▋ | 656/17840 [1:06:28<33:11:59, 6.96s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:06:28<33:11:59, 6.96s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:06:28<33:11:59, 6.96s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:06:35<33:37:45, 7.05s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:06:35<33:37:45, 7.05s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:47:56,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:06:42<33:55:27, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:06:42<33:55:27, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5128, 'learning_rate': 6.55e-05, 'epoch': 0.74} + 4%|██▋ | 658/17840 [1:06:42<33:55:27, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:06:42<33:55:27, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:06:49<34:02:46, 7.13s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:06:49<34:02:46, 7.13s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:08,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:08,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:06:57<34:12:12, 7.17s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:06:57<34:12:12, 7.17s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4801, 'learning_rate': 6.570000000000001e-05, 'epoch': 0.74} + 4%|██▋ | 660/17840 [1:06:57<34:12:12, 7.17s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:06:57<34:12:12, 7.17s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:07:04<34:05:16, 7.14s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:07:04<34:05:16, 7.14s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1625, 'learning_rate': 6.58e-05, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:24,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:11<33:54:23, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:11<33:54:23, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1942, 'learning_rate': 6.59e-05, 'epoch': 0.74} + 4%|██▋ | 662/17840 [1:07:11<33:54:23, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:11<33:54:23, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:07:11<33:54:23, 7.11s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 663/17840 [1:07:18<33:46:05, 7.08s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:37,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:37,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 664/17840 [1:07:25<33:30:35, 7.02s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 664/17840 [1:07:25<33:30:35, 7.02s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2197, 'learning_rate': 6.610000000000001e-05, 'epoch': 0.74} + 4%|██▊ | 664/17840 [1:07:25<33:30:35, 7.02s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:47,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:47,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.208, 'learning_rate': 6.620000000000001e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:47,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:47,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:07:38<33:08:34, 6.95s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:07:38<33:08:34, 6.95s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:57,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:48:57,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 667/17840 [1:07:45<33:02:48, 6.93s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 667/17840 [1:07:45<33:02:48, 6.93s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1885, 'learning_rate': 6.64e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:06,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 668/17840 [1:07:52<32:52:30, 6.89s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 668/17840 [1:07:52<32:52:30, 6.89s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3868, 'learning_rate': 6.65e-05, 'epoch': 0.75} + 4%|██▊ | 668/17840 [1:07:52<32:52:30, 6.89s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 668/17840 [1:07:52<32:52:30, 6.89s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:07:59<32:40:35, 6.85s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:07:59<32:40:35, 6.85s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:18,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:18,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [1:08:05<32:25:54, 6.80s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [1:08:05<32:25:54, 6.80s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4249, 'learning_rate': 6.670000000000001e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:26,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [1:08:12<32:13:41, 6.76s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [1:08:12<32:13:41, 6.76s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2524, 'learning_rate': 6.680000000000001e-05, 'epoch': 0.75} + 4%|██▊ | 671/17840 [1:08:12<32:13:41, 6.76s/it]g-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:34,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:34,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1729, 'learning_rate': 6.690000000000001e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:34,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:34,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:46:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 673/17840 [1:08:25<31:48:32, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 673/17840 [1:08:25<31:48:32, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2125, 'learning_rate': 6.7e-05, 'epoch': 0.75} + 4%|██▊ | 673/17840 [1:08:25<31:48:32, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:08:32<31:37:08, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:08:32<31:37:08, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.292, 'learning_rate': 6.71e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:52,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:49:52,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:08:41<34:43:15, 7.28s/it]g-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:08:41<34:43:15, 7.28s/it]g-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:08:41<34:43:15, 7.28s/it]g-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:08:41<34:43:15, 7.28s/it]g-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:03,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:03,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:03,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:09,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:09,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1961, 'learning_rate': 6.740000000000001e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:09,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:09,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:49:42,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:09:00<31:59:55, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:17,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:09:00<31:59:55, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:17,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0405, 'learning_rate': 6.750000000000001e-05, 'epoch': 0.76} + 4%|██▊ | 678/17840 [1:09:00<31:59:55, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:17,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:09:00<31:59:55, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:17,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:09:06<31:21:35, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:23,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:09:06<31:21:35, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:23,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:09:06<31:21:35, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:23,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:09:06<31:21:35, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:23,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:09:12<30:49:31, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:09:12<30:49:31, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:09:12<30:49:31, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:09:12<30:49:31, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:09:19<30:24:56, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:37,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:37,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:37,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:09:25<30:02:15, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:42,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:09:25<30:02:15, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:42,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:09:25<30:02:15, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:42,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:09:25<30:02:15, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:42,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 683/17840 [1:09:31<29:43:07, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 683/17840 [1:09:31<29:43:07, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:52,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:52,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4644, 'learning_rate': 6.81e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:52,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:58,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:50:58,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5392, 'learning_rate': 6.82e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:02,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:02,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 686/17840 [1:09:48<28:23:49, 5.96s/it]g-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 686/17840 [1:09:48<28:23:49, 5.96s/it]g-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:08,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:08,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:50:48,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:09:54<27:55:20, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:09:54<27:55:20, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:15,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:15,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.45, 'learning_rate': 6.850000000000001e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:15,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:20,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:20,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5325, 'learning_rate': 6.860000000000001e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:24,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:24,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:11,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 690/17840 [1:10:10<26:17:34, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:27,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 690/17840 [1:10:10<26:17:34, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:27,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:31,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:27,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:31,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:27,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2887, 'learning_rate': 6.879999999999999e-05, 'epoch': 0.77} + 4%|██▊ | 692/17840 [1:10:20<24:39:56, 5.18s/it]g-point operations will not be computed-17 17:51:27,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 692/17840 [1:10:20<24:39:56, 5.18s/it]g-point operations will not be computed-17 17:51:27,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 692/17840 [1:10:20<24:39:56, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:36,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:39,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:36,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:39,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:36,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 693/17840 [1:10:24<23:26:33, 4.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:41,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:43,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:41,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:43,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:41,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 694/17840 [1:10:28<22:01:32, 4.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:44,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 695/17840 [1:10:32<20:33:29, 4.32s/it]g-point operations will not be computed-17 17:51:44,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 695/17840 [1:10:32<20:33:29, 4.32s/it]g-point operations will not be computed-17 17:51:44,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 695/17840 [1:10:32<20:33:29, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:48,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 696/17840 [1:10:35<19:06:23, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:51,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 696/17840 [1:10:35<19:06:23, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:51,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 697/17840 [1:10:38<17:42:17, 3.72s/it]g-point operations will not be computed-17 17:51:51,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 697/17840 [1:10:38<17:42:17, 3.72s/it]g-point operations will not be computed-17 17:51:51,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:55,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:54,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:51:55,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:54,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 698/17840 [1:10:41<16:10:53, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:57,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 699/17840 [1:10:43<14:43:26, 3.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:59,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 699/17840 [1:10:43<14:43:26, 3.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:51:59,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:00,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:51:59,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:10:47<15:58:29, 3.36s/it]g-point operations will not be computed-17 17:51:59,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:10:47<15:58:29, 3.36s/it]g-point operations will not be computed-17 17:51:59,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:10:47<15:58:29, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:05,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:10:47<15:58:29, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:05,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:08,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:05,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:10:55<22:17:33, 4.68s/it]g-point operations will not be computed-17 17:52:05,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:10:55<22:17:33, 4.68s/it]g-point operations will not be computed-17 17:52:05,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:10:55<22:17:33, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:12,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:10:55<22:17:33, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:12,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:10:55<22:17:33, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:12,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:10:55<22:17:33, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:12,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:11:02<26:20:20, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:11:02<26:20:20, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:11:02<26:20:20, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:11:10<28:56:37, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:11:10<28:56:37, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2308, 'learning_rate': 7e-05, 'epoch': 0.79} + 4%|██▉ | 703/17840 [1:11:10<28:56:37, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:11:10<28:56:37, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:11:10<28:56:37, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:20,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:11:17<30:39:32, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:11:17<30:39:32, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:11:17<30:39:32, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:11:24<31:55:57, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:11:24<31:55:57, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4654, 'learning_rate': 7.02e-05, 'epoch': 0.79} + 4%|██▉ | 705/17840 [1:11:24<31:55:57, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:11:24<31:55:57, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:11:31<32:33:50, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:11:31<32:33:50, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6859, 'learning_rate': 7.03e-05, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-17 17:52:52,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:11:39<33:09:06, 6.97s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:11:39<33:09:06, 6.97s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5938, 'learning_rate': 7.04e-05, 'epoch': 0.79} + 4%|██▉ | 707/17840 [1:11:39<33:09:06, 6.97s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:11:39<33:09:06, 6.97s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:11:46<33:32:08, 7.05s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:11:46<33:32:08, 7.05s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.485, 'learning_rate': 7.05e-05, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:07,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:11:53<33:39:12, 7.07s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:11:53<33:39:12, 7.07s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4172, 'learning_rate': 7.06e-05, 'epoch': 0.79} + 4%|██▉ | 709/17840 [1:11:53<33:39:12, 7.07s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:11:53<33:39:12, 7.07s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 710/17840 [1:12:00<33:46:43, 7.10s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 710/17840 [1:12:00<33:46:43, 7.10s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:19,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:19,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:12:07<33:35:42, 7.06s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:12:07<33:35:42, 7.06s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2336, 'learning_rate': 7.08e-05, 'epoch': 0.8} + 4%|██▉ | 711/17840 [1:12:07<33:35:42, 7.06s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:12:07<33:35:42, 7.06s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 712/17840 [1:12:14<33:30:51, 7.04s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 712/17840 [1:12:14<33:30:51, 7.04s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:33,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:33,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:12:21<33:30:28, 7.04s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:12:21<33:30:28, 7.04s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2831, 'learning_rate': 7.1e-05, 'epoch': 0.8} + 4%|██▉ | 713/17840 [1:12:21<33:30:28, 7.04s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:44,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:44,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5154, 'learning_rate': 7.11e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:44,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:44,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:12:35<33:14:04, 6.99s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:12:35<33:14:04, 6.99s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5476, 'learning_rate': 7.12e-05, 'epoch': 0.8} + 4%|██▉ | 715/17840 [1:12:35<33:14:04, 6.99s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:12:35<33:14:04, 6.99s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:57,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:57,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:57,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:53:57,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:12:49<32:53:57, 6.92s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:12:49<32:53:57, 6.92s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:08,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:08,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:12:56<32:43:00, 6.88s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:12:56<32:43:00, 6.88s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2215, 'learning_rate': 7.15e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:16,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:13:02<32:25:02, 6.82s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:13:02<32:25:02, 6.82s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1022, 'learning_rate': 7.16e-05, 'epoch': 0.81} + 4%|██▉ | 719/17840 [1:13:02<32:25:02, 6.82s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:24,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:24,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3257, 'learning_rate': 7.17e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:24,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:24,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:13:16<32:06:25, 6.75s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:13:16<32:06:25, 6.75s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:34,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:34,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:34,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:13:22<31:56:21, 6.72s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:13:22<31:56:21, 6.72s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:13:22<31:56:21, 6.72s/it]g-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:44,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:44,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4158, 'learning_rate': 7.2e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:44,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:44,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:54:44,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:52:34,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:13:35<31:36:10, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:13:35<31:36:10, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:13:35<31:36:10, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:13:44<34:47:01, 7.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:13:44<34:47:01, 7.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2668, 'learning_rate': 7.22e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:05,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 726/17840 [1:13:51<33:51:13, 7.12s/it]g-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 726/17840 [1:13:51<33:51:13, 7.12s/it]g-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6233, 'learning_rate': 7.23e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:11,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 727/17840 [1:13:57<32:53:16, 6.92s/it]g-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 727/17840 [1:13:57<32:53:16, 6.92s/it]g-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2839, 'learning_rate': 7.24e-05, 'epoch': 0.82} + 4%|███ | 727/17840 [1:13:57<32:53:16, 6.92s/it]g-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 727/17840 [1:13:57<32:53:16, 6.92s/it]g-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:19,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:19,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:19,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:19,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:26,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:26,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:26,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:32,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:32,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3965, 'learning_rate': 7.27e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:32,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:38,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:38,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6112, 'learning_rate': 7.280000000000001e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:38,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:44,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:44,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3315, 'learning_rate': 7.29e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:44,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:44,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:44,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:54:53,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:14:35<29:41:46, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:55:55,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 734/17840 [1:14:41<29:09:11, 6.14s/it]g-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 734/17840 [1:14:41<29:09:11, 6.14s/it]g-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5456, 'learning_rate': 7.31e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:00,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:00,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 735/17840 [1:14:46<28:32:00, 6.01s/it]g-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 735/17840 [1:14:46<28:32:00, 6.01s/it]g-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:06,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:06,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 736/17840 [1:14:52<27:56:30, 5.88s/it]g-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:10,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:10,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:10,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:55:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 737/17840 [1:14:57<27:26:53, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:14,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:17,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:14,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:17,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:14,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 738/17840 [1:15:03<26:48:43, 5.64s/it]g-point operations will not be computed-17 17:56:14,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:21,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:14,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:21,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:14,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:21,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:14,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 739/17840 [1:15:08<26:02:37, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:27,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:27,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 740/17840 [1:15:13<25:17:28, 5.32s/it]g-point operations will not be computed-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:31,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:33,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:33,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.77, 'learning_rate': 7.38e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:37,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:37,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:25,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 742/17840 [1:15:22<23:42:03, 4.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:39,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:41,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:39,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:41,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:39,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 743/17840 [1:15:27<22:56:21, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:43,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:45,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:43,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:45,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:43,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 744/17840 [1:15:31<21:58:28, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:47,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:49,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:47,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:49,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:47,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 745/17840 [1:15:35<20:49:40, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:51,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:53,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:51,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:53,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:51,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:56,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:54,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:56:56,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:56:54,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 747/17840 [1:15:41<17:53:47, 3.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:56:57,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 748/17840 [1:15:44<16:14:41, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:57:00,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 748/17840 [1:15:44<16:14:41, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:57:00,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 749/17840 [1:15:46<14:41:12, 3.09s/it]g-point operations will not be computed-17 17:57:00,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 749/17840 [1:15:46<14:41:12, 3.09s/it]g-point operations will not be computed-17 17:57:00,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:03,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:02,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:03,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:02,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 750/17840 [1:15:50<16:07:38, 3.40s/it]g-point operations will not be computed-17 17:57:02,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 750/17840 [1:15:50<16:07:38, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:57:08,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:12,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:08,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:15:58<22:27:00, 4.73s/it]g-point operations will not be computed-17 17:57:08,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:15:58<22:27:00, 4.73s/it]g-point operations will not be computed-17 17:57:08,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:15:58<22:27:00, 4.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:15:58<22:27:00, 4.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:19,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:19,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:16:05<26:30:57, 5.59s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:16:05<26:30:57, 5.59s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:16:05<26:30:57, 5.59s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:16:05<26:30:57, 5.59s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:16:05<26:30:57, 5.59s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:16:13<29:11:18, 6.15s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:16:13<29:11:18, 6.15s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:34,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:16:20<30:54:56, 6.51s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:16:20<30:54:56, 6.51s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.525, 'learning_rate': 7.510000000000001e-05, 'epoch': 0.85} + 4%|███▏ | 754/17840 [1:16:20<30:54:56, 6.51s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:16:20<30:54:56, 6.51s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:16:20<30:54:56, 6.51s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:16:28<31:59:09, 6.74s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:16:28<31:59:09, 6.74s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:16:28<31:59:09, 6.74s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:50,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:50,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4238, 'learning_rate': 7.53e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:50,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:57:50,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:16:42<33:16:09, 7.01s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:16:42<33:16:09, 7.01s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3923, 'learning_rate': 7.54e-05, 'epoch': 0.85} + 4%|███▏ | 757/17840 [1:16:42<33:16:09, 7.01s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:05,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:05,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4121, 'learning_rate': 7.55e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:05,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:05,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:16:56<33:34:49, 7.08s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:16:56<33:34:49, 7.08s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2518, 'learning_rate': 7.560000000000001e-05, 'epoch': 0.85} + 4%|███▏ | 759/17840 [1:16:56<33:34:49, 7.08s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3593, 'learning_rate': 7.570000000000001e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:19,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 761/17840 [1:17:11<33:30:34, 7.06s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 761/17840 [1:17:11<33:30:34, 7.06s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:58:31,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:17:18<33:25:50, 7.05s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:17:18<33:25:50, 7.05s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4069, 'learning_rate': 7.59e-05, 'epoch': 0.85} + 4%|███▏ | 762/17840 [1:17:18<33:25:50, 7.05s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:17:18<33:25:50, 7.05s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:17:18<33:25:50, 7.05s/it]g-point operations will not be computed-17 17:57:15,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 763/17840 [1:17:25<33:16:36, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:42,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 763/17840 [1:17:25<33:16:36, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:42,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 763/17840 [1:17:25<33:16:36, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:42,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:17:31<33:09:44, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:42,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:17:31<33:09:44, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:42,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2331, 'learning_rate': 7.61e-05, 'epoch': 0.86} + 4%|███▏ | 764/17840 [1:17:31<33:09:44, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:42,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:17:31<33:09:44, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:42,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:17:31<33:09:44, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:42,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:17:38<33:06:05, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:17:38<33:06:05, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:17:38<33:06:05, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:17:45<33:04:20, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:17:45<33:04:20, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2336, 'learning_rate': 7.630000000000001e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:06,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:17:52<32:58:56, 6.95s/it]g-point operations will not be computed-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:17:52<32:58:56, 6.95s/it]g-point operations will not be computed-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2634, 'learning_rate': 7.64e-05, 'epoch': 0.86} + 4%|███▏ | 767/17840 [1:17:52<32:58:56, 6.95s/it]g-point operations will not be computed-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:17:52<32:58:56, 6.95s/it]g-point operations will not be computed-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:17:52<32:58:56, 6.95s/it]g-point operations will not be computed-17 17:58:56,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:17:59<32:44:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:17:59<32:44:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:17:59<32:44:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:18:06<32:33:49, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:18:06<32:33:49, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4303, 'learning_rate': 7.66e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:26,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 770/17840 [1:18:13<32:23:03, 6.83s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 770/17840 [1:18:13<32:23:03, 6.83s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5228, 'learning_rate': 7.670000000000001e-05, 'epoch': 0.86} + 4%|███▏ | 770/17840 [1:18:13<32:23:03, 6.83s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3153, 'learning_rate': 7.680000000000001e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 772/17840 [1:18:26<32:05:17, 6.77s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 772/17840 [1:18:26<32:05:17, 6.77s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5192, 'learning_rate': 7.69e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:47,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 773/17840 [1:18:33<32:00:36, 6.75s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 773/17840 [1:18:33<32:00:36, 6.75s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6207, 'learning_rate': 7.7e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 17:59:53,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:18:39<31:43:33, 6.69s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:18:39<31:43:33, 6.69s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.046, 'learning_rate': 7.71e-05, 'epoch': 0.87} + 4%|███▏ | 774/17840 [1:18:39<31:43:33, 6.69s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:18:39<31:43:33, 6.69s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 775/17840 [1:18:48<35:00:06, 7.38s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 775/17840 [1:18:48<35:00:06, 7.38s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:07,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:07,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 776/17840 [1:18:55<33:52:00, 7.14s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 776/17840 [1:18:55<33:52:00, 7.14s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:14,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:14,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 777/17840 [1:19:01<32:48:03, 6.92s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 777/17840 [1:19:01<32:48:03, 6.92s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2279, 'learning_rate': 7.740000000000001e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:22,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 778/17840 [1:19:08<32:03:38, 6.76s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 778/17840 [1:19:08<32:03:38, 6.76s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4905, 'learning_rate': 7.75e-05, 'epoch': 0.87} + 4%|███▏ | 778/17840 [1:19:08<32:03:38, 6.76s/it]g-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:29,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:29,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3758, 'learning_rate': 7.76e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:29,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:36,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:36,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2286, 'learning_rate': 7.77e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:36,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:42,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:42,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3139, 'learning_rate': 7.780000000000001e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:42,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:42,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:00:42,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 17:59:16,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:19:33<30:06:21, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:50,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:19:33<30:06:21, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:50,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:19:33<30:06:21, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:50,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:19:33<30:06:21, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:50,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 783/17840 [1:19:39<29:39:33, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 783/17840 [1:19:39<29:39:33, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:00,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:00,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2292, 'learning_rate': 7.81e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:00,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:00,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:06,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:06,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:10,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:10,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 786/17840 [1:19:56<28:32:55, 6.03s/it]g-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:15,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:15,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:15,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 787/17840 [1:20:02<27:56:29, 5.90s/it]g-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:20,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:20,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:20,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:00:56,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 788/17840 [1:20:08<27:23:52, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:24,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 788/17840 [1:20:08<27:23:52, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:24,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 788/17840 [1:20:08<27:23:52, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:24,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:28,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:24,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:28,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:24,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:32,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:24,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:32,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:24,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 790/17840 [1:20:18<26:02:07, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 790/17840 [1:20:18<26:02:07, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 790/17840 [1:20:18<26:02:07, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:38,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:41,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:01:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2843, 'learning_rate': 7.890000000000001e-05, 'epoch': 0.89} + 4%|███▎ | 793/17840 [1:20:32<23:26:23, 4.95s/it]g-point operations will not be computed-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 793/17840 [1:20:32<23:26:23, 4.95s/it]g-point operations will not be computed-17 18:01:35,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 793/17840 [1:20:32<23:26:23, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:49,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 794/17840 [1:20:36<22:19:45, 4.72s/it]g-point operations will not be computed-17 18:01:49,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 794/17840 [1:20:36<22:19:45, 4.72s/it]g-point operations will not be computed-17 18:01:49,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 794/17840 [1:20:36<22:19:45, 4.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:53,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 795/17840 [1:20:40<20:57:54, 4.43s/it]g-point operations will not be computed-17 18:01:53,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 795/17840 [1:20:40<20:57:54, 4.43s/it]g-point operations will not be computed-17 18:01:53,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 795/17840 [1:20:40<20:57:54, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:57,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 795/17840 [1:20:40<20:57:54, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:01:57,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 796/17840 [1:20:43<19:30:49, 4.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:00,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 18:02:00,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 18:02:00,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:04,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:03,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 798/17840 [1:20:49<16:28:28, 3.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:05,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 798/17840 [1:20:49<16:28:28, 3.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:05,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 799/17840 [1:20:52<14:51:48, 3.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:08,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 799/17840 [1:20:52<14:51:48, 3.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:08,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:09,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:08,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 800/17840 [1:20:56<16:04:40, 3.40s/it]g-point operations will not be computed-17 18:02:08,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 800/17840 [1:20:56<16:04:40, 3.40s/it]g-point operations will not be computed-17 18:02:08,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 800/17840 [1:20:56<16:04:40, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:14,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 800/17840 [1:20:56<16:04:40, 3.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:14,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:18,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:14,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 801/17840 [1:21:04<23:06:49, 4.88s/it]g-point operations will not be computed-17 18:02:14,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 801/17840 [1:21:04<23:06:49, 4.88s/it]g-point operations will not be computed-17 18:02:14,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 801/17840 [1:21:04<23:06:49, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 801/17840 [1:21:04<23:06:49, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 801/17840 [1:21:04<23:06:49, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 801/17840 [1:21:04<23:06:49, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:21:12<26:54:18, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:21:12<26:54:18, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:21:12<26:54:18, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:21:12<26:54:18, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 802/17840 [1:21:12<26:54:18, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:21,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:21:19<29:16:36, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:21:19<29:16:36, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 803/17840 [1:21:19<29:16:36, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:21:26<30:48:44, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:21:26<30:48:44, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4142, 'learning_rate': 8.010000000000001e-05, 'epoch': 0.9} + 5%|███▎ | 804/17840 [1:21:26<30:48:44, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:21:26<30:48:44, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:21:26<30:48:44, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:21:34<32:00:31, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:21:34<32:00:31, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:02:54,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:21:41<32:45:52, 6.92s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:21:41<32:45:52, 6.92s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5287, 'learning_rate': 8.030000000000001e-05, 'epoch': 0.9} + 5%|███▎ | 806/17840 [1:21:41<32:45:52, 6.92s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:21:41<32:45:52, 6.92s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:21:41<32:45:52, 6.92s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:21:48<33:13:48, 7.02s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:21:48<33:13:48, 7.02s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:21:48<33:13:48, 7.02s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2525, 'learning_rate': 8.05e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 809/17840 [1:22:02<33:34:28, 7.10s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 809/17840 [1:22:02<33:34:28, 7.10s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5585, 'learning_rate': 8.060000000000001e-05, 'epoch': 0.91} + 5%|███▎ | 809/17840 [1:22:02<33:34:28, 7.10s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:25,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:25,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2244, 'learning_rate': 8.070000000000001e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:25,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:25,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 811/17840 [1:22:17<33:34:14, 7.10s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 811/17840 [1:22:17<33:34:14, 7.10s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5783, 'learning_rate': 8.080000000000001e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:37,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:22:24<33:22:16, 7.06s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:22:24<33:22:16, 7.06s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5057, 'learning_rate': 8.090000000000001e-05, 'epoch': 0.91} + 5%|███▎ | 812/17840 [1:22:24<33:22:16, 7.06s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:22:24<33:22:16, 7.06s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:22:24<33:22:16, 7.06s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:22:31<33:13:45, 7.03s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:22:31<33:13:45, 7.03s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:03:51,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:22:37<33:03:53, 6.99s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:22:37<33:03:53, 6.99s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.307, 'learning_rate': 8.11e-05, 'epoch': 0.91} + 5%|███▍ | 814/17840 [1:22:37<33:03:53, 6.99s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:00,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:00,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:03,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:03,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 816/17840 [1:22:51<32:46:34, 6.93s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 816/17840 [1:22:51<32:46:34, 6.93s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2743, 'learning_rate': 8.13e-05, 'epoch': 0.91} + 5%|███▍ | 816/17840 [1:22:51<32:46:34, 6.93s/it]g-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:13,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:13,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4426, 'learning_rate': 8.14e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:13,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:13,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:13,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:02:36,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 818/17840 [1:23:05<32:20:36, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 818/17840 [1:23:05<32:20:36, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 818/17840 [1:23:05<32:20:36, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 819/17840 [1:23:11<32:12:07, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 819/17840 [1:23:11<32:12:07, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4366, 'learning_rate': 8.16e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:32,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:23:18<32:00:04, 6.77s/it]g-point operations will not be computed-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:23:18<32:00:04, 6.77s/it]g-point operations will not be computed-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3529, 'learning_rate': 8.17e-05, 'epoch': 0.92} + 5%|███▍ | 820/17840 [1:23:18<32:00:04, 6.77s/it]g-point operations will not be computed-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:23:18<32:00:04, 6.77s/it]g-point operations will not be computed-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:23:18<32:00:04, 6.77s/it]g-point operations will not be computed-17 18:04:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:23:25<31:52:31, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:23:25<31:52:31, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:23:25<31:52:31, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:23:25<31:52:31, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:23:31<31:40:46, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:50,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:50,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:23:38<31:21:51, 6.64s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:23:38<31:21:51, 6.64s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:57,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:04:57,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 824/17840 [1:23:44<31:13:10, 6.60s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 824/17840 [1:23:44<31:13:10, 6.60s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4422, 'learning_rate': 8.21e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:05,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:23:53<34:28:12, 7.29s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:23:53<34:28:12, 7.29s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5981, 'learning_rate': 8.22e-05, 'epoch': 0.92} + 5%|███▍ | 825/17840 [1:23:53<34:28:12, 7.29s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:15,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:15,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.444, 'learning_rate': 8.23e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:15,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:15,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:15,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 827/17840 [1:24:06<32:13:54, 6.82s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:25,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:25,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:25,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 828/17840 [1:24:12<31:25:20, 6.65s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:31,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:31,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:24:19<30:47:53, 6.52s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:24:19<30:47:53, 6.52s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:37,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:37,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 830/17840 [1:24:25<30:15:33, 6.40s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 830/17840 [1:24:25<30:15:33, 6.40s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:24:31<29:55:23, 6.33s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:24:31<29:55:23, 6.33s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:49,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:49,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:24:37<29:37:13, 6.27s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:24:37<29:37:13, 6.27s/it]g-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:55,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:05:55,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:04:42,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:24:43<29:16:04, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:00,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:24:43<29:16:04, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:00,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6132, 'learning_rate': 8.3e-05, 'epoch': 0.93} + 5%|███▍ | 833/17840 [1:24:43<29:16:04, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:00,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:24:43<29:16:04, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:00,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:24:49<28:48:45, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:24:49<28:48:45, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:10,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:10,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3315, 'learning_rate': 8.32e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:10,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4178, 'learning_rate': 8.33e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:20,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 837/17840 [1:25:06<27:11:25, 5.76s/it]g-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 837/17840 [1:25:06<27:11:25, 5.76s/it]g-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:24,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:24,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:06,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 838/17840 [1:25:11<26:38:57, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:28,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 838/17840 [1:25:11<26:38:57, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:28,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6985, 'learning_rate': 8.35e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:32,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:28,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:32,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:28,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:34,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:28,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:34,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:28,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:34,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:28,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 840/17840 [1:25:21<25:00:06, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:38,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:40,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:38,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 841/17840 [1:25:26<24:05:04, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 841/17840 [1:25:26<24:05:04, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6203, 'learning_rate': 8.38e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:46,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:46,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:48,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:50,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:50,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:52,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:53,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:53,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:06:58,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:00,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:00,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:02,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:02,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:05,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:06,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:06,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:08,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:08,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:11,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:11,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4854, 'learning_rate': 8.47e-05, 'epoch': 0.95} +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:15,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:19,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:19,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5493, 'learning_rate': 8.48e-05, 'epoch': 0.95} +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:23,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:23,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:27,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:27,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4406, 'learning_rate': 8.49e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:30,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:07:30,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:26:19<28:49:03, 6.11s/it]g-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:26:19<28:49:03, 6.11s/it]g-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7294, 'learning_rate': 8.5e-05, 'epoch': 0.96} + 5%|███▌ | 853/17840 [1:26:19<28:49:03, 6.11s/it]g-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 853/17840 [1:26:19<28:49:03, 6.11s/it]g-point operations will not be computed-17 18:06:42,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3116, 'learning_rate': 8.510000000000001e-05, 'epoch': 0.96} + 5%|███▌ | 854/17840 [1:26:26<30:35:19, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 854/17840 [1:26:26<30:35:19, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 854/17840 [1:26:26<30:35:19, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 854/17840 [1:26:26<30:35:19, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:33<31:52:18, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:33<31:52:18, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:33<31:52:18, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:33<31:52:18, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:26:33<31:52:18, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 856/17840 [1:26:41<32:37:35, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:00,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:00,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:00,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:26:48<33:04:20, 7.01s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:26:48<33:04:20, 7.01s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:26:48<33:04:20, 7.01s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:26:48<33:04:20, 7.01s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:26:48<33:04:20, 7.01s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:26:55<33:13:44, 7.04s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:26:55<33:13:44, 7.04s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:16,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:16,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:02<33:24:07, 7.08s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:02<33:24:07, 7.08s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:02<33:24:07, 7.08s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:02<33:24:07, 7.08s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:27:02<33:24:07, 7.08s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:27:09<33:22:40, 7.08s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:28,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:28,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:28,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:27:16<33:19:38, 7.07s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:27:16<33:19:38, 7.07s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 861/17840 [1:27:16<33:19:38, 7.07s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:39,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:39,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5303, 'learning_rate': 8.59e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:39,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:39,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:39,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:27:30<32:54:35, 6.98s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:27:30<32:54:35, 6.98s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:51,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 864/17840 [1:27:37<32:41:56, 6.93s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 864/17840 [1:27:37<32:41:56, 6.93s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0502, 'learning_rate': 8.61e-05, 'epoch': 0.97} + 5%|███▌ | 864/17840 [1:27:37<32:41:56, 6.93s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5061, 'learning_rate': 8.620000000000001e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:08:59,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 866/17840 [1:27:50<32:20:59, 6.86s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:09,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:09,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:27:57<32:07:40, 6.81s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:27:57<32:07:40, 6.81s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4683, 'learning_rate': 8.64e-05, 'epoch': 0.97} + 5%|███▌ | 867/17840 [1:27:57<32:07:40, 6.81s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:27:57<32:07:40, 6.81s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:27:57<32:07:40, 6.81s/it]g-point operations will not be computed-17 18:07:43,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:28:04<31:57:41, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:28:04<31:57:41, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:28:04<31:57:41, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:28:04<31:57:41, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 869/17840 [1:28:11<31:47:40, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:29,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:29,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:29,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:28:17<31:36:48, 6.71s/it]g-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:36,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:36,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 871/17840 [1:28:24<31:23:26, 6.66s/it]g-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 871/17840 [1:28:24<31:23:26, 6.66s/it]g-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3591, 'learning_rate': 8.680000000000001e-05, 'epoch': 0.98} + 5%|███▌ | 871/17840 [1:28:24<31:23:26, 6.66s/it]g-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:46,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:46,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.635, 'learning_rate': 8.69e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:46,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:46,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:09:46,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:09:21,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:28:37<30:57:17, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:54,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:28:37<30:57:17, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:54,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:28:37<30:57:17, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:54,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:28:37<30:57:17, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:09:54,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:28:43<30:41:09, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:28:43<30:41:09, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:28:43<30:41:09, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 875/17840 [1:28:52<33:56:39, 7.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 875/17840 [1:28:52<33:56:39, 7.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9058, 'learning_rate': 8.72e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:12,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 876/17840 [1:28:58<32:35:54, 6.92s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 876/17840 [1:28:58<32:35:54, 6.92s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4126, 'learning_rate': 8.730000000000001e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:18,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 877/17840 [1:29:04<31:23:46, 6.66s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 877/17840 [1:29:04<31:23:46, 6.66s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2949, 'learning_rate': 8.740000000000001e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:24,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:29:10<30:29:50, 6.47s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:29:10<30:29:50, 6.47s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3304, 'learning_rate': 8.75e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:30,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:30,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 879/17840 [1:29:16<29:45:05, 6.31s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:35,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:35,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 880/17840 [1:29:22<29:02:02, 6.16s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 880/17840 [1:29:22<29:02:02, 6.16s/it]g-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:40,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:40,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:40,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:00,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 881/17840 [1:29:28<28:12:30, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:45,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 881/17840 [1:29:28<28:12:30, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:45,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:45,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:45,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3737, 'learning_rate': 8.790000000000001e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:52,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:45,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:52,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:45,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 883/17840 [1:29:38<26:32:56, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 883/17840 [1:29:38<26:32:56, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:59,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:10:59,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:01,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:03,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:03,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3527, 'learning_rate': 8.82e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:06,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:06,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:10:55,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 886/17840 [1:29:52<23:07:30, 4.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:09,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:10,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:09,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:10,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:09,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 887/17840 [1:29:56<21:38:42, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:12,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 888/17840 [1:29:59<20:05:03, 4.27s/it]g-point operations will not be computed-17 18:11:12,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 888/17840 [1:29:59<20:05:03, 4.27s/it]g-point operations will not be computed-17 18:11:12,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:17,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:16,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:17,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:16,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 889/17840 [1:30:02<18:27:44, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:19,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 890/17840 [1:30:05<16:49:03, 3.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:21,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 890/17840 [1:30:05<16:49:03, 3.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:21,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 891/17840 [1:30:08<15:09:02, 3.22s/it]g-point operations will not be computed-17 18:11:21,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 891/17840 [1:30:08<15:09:02, 3.22s/it]g-point operations will not be computed-17 18:11:21,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:30:10<13:25:14, 2.85s/it]g-point operations will not be computed-17 18:11:24,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:30:10<13:25:14, 2.85s/it]g-point operations will not be computed-17 18:11:24,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:30:10<13:25:14, 2.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:27,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:30:10<13:25:14, 2.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:27,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:31,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:27,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:18<20:51:04, 4.43s/it]g-point operations will not be computed-17 18:11:27,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:18<20:51:04, 4.43s/it]g-point operations will not be computed-17 18:11:27,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:18<20:51:04, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:30:18<20:51:04, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:39,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:30:26<25:35:38, 5.44s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:30:26<25:35:38, 5.44s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5055, 'learning_rate': 8.910000000000001e-05, 'epoch': 1.0} + 5%|███▋ | 894/17840 [1:30:26<25:35:38, 5.44s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:30:26<25:35:38, 5.44s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:30:33<28:30:36, 6.06s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:30:33<28:30:36, 6.06s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.319, 'learning_rate': 8.92e-05, 'epoch': 1.0} +[WARNING|modeling_utils.py:388] 2022-03-17 18:11:54,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:30:40<30:17:44, 6.44s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:30:40<30:17:44, 6.44s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1485, 'learning_rate': 8.93e-05, 'epoch': 1.0} + 5%|███▋ | 896/17840 [1:30:40<30:17:44, 6.44s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:30:40<30:17:44, 6.44s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:30:48<31:33:42, 6.71s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:30:48<31:33:42, 6.71s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1794, 'learning_rate': 8.94e-05, 'epoch': 1.01} + 5%|███▋ | 897/17840 [1:30:48<31:33:42, 6.71s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:30:48<31:33:42, 6.71s/it]g-point operations will not be computed-17 18:11:35,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:30:55<32:31:02, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:30:55<32:31:02, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:12:16,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:31:02<32:59:27, 7.01s/it]g-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:31:02<32:59:27, 7.01s/it]g-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9793, 'learning_rate': 8.960000000000001e-05, 'epoch': 1.01} + 5%|███▋ | 899/17840 [1:31:02<32:59:27, 7.01s/it]g-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:31:02<32:59:27, 7.01s/it]g-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:31:12<36:34:23, 7.77s/it]g-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:31:12<36:34:23, 7.77s/it]g-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5082, 'learning_rate': 8.970000000000001e-05, 'epoch': 1.01} + 5%|███▋ | 900/17840 [1:31:12<36:34:23, 7.77s/it]g-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:31:12<36:34:23, 7.77s/it]g-point operations will not be computed-17 18:12:12,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:31:19<35:45:57, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:36,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:31:19<35:45:57, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:36,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2142, 'learning_rate': 8.98e-05, 'epoch': 1.01} + 5%|███▋ | 901/17840 [1:31:19<35:45:57, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:36,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:31:26<35:14:21, 7.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:36,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:31:26<35:14:21, 7.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:36,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3414, 'learning_rate': 8.99e-05, 'epoch': 1.01} + 5%|███▋ | 902/17840 [1:31:26<35:14:21, 7.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:36,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:31:26<35:14:21, 7.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:36,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:31:26<35:14:21, 7.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:36,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:31:33<34:37:16, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:31:33<34:37:16, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:31:33<34:37:16, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 904/17840 [1:31:40<34:09:13, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 904/17840 [1:31:40<34:09:13, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2347, 'learning_rate': 9.010000000000001e-05, 'epoch': 1.01} + 5%|███▋ | 904/17840 [1:31:40<34:09:13, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:03,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:03,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1, 'learning_rate': 9.020000000000001e-05, 'epoch': 1.01} +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:03,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:03,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:31:54<33:14:58, 7.07s/it]g-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:31:54<33:14:58, 7.07s/it]g-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:13,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:13,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:32:01<32:53:39, 6.99s/it]g-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:32:01<32:53:39, 6.99s/it]g-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2217, 'learning_rate': 9.04e-05, 'epoch': 1.02} + 5%|███▊ | 907/17840 [1:32:01<32:53:39, 6.99s/it]g-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:23,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:23,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2471, 'learning_rate': 9.05e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:23,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:23,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:23,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:12:51,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 909/17840 [1:32:15<32:25:21, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 909/17840 [1:32:15<32:25:21, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 909/17840 [1:32:15<32:25:21, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 909/17840 [1:32:15<32:25:21, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:32:21<32:23:08, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:32:21<32:23:08, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:32:21<32:23:08, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:32:21<32:23:08, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:44,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:44,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:44,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:44,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:13:44,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:32,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:32:35<31:49:59, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:32:35<31:49:59, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:32:35<31:49:59, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:32:35<31:49:59, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 913/17840 [1:32:42<31:47:04, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 913/17840 [1:32:42<31:47:04, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:02,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:02,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:32:48<31:44:08, 6.75s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:32:48<31:44:08, 6.75s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:32:48<31:44:08, 6.75s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:10,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:10,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8728, 'learning_rate': 9.120000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:10,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:17,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:17,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1234, 'learning_rate': 9.130000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:17,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:17,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:17,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 917/17840 [1:33:08<31:07:10, 6.62s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:27,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:27,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:27,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 918/17840 [1:33:14<31:00:19, 6.60s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:33,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:33,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:33,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 919/17840 [1:33:21<30:52:27, 6.57s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 919/17840 [1:33:21<30:52:27, 6.57s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:41,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:41,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:33:27<30:30:11, 6.49s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:33:27<30:30:11, 6.49s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:33:27<30:30:11, 6.49s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:49,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:49,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8077, 'learning_rate': 9.180000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:49,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:55,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:55,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1857, 'learning_rate': 9.190000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:14:55,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:01,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:01,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2053, 'learning_rate': 9.200000000000001e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:01,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:08,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:08,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0103, 'learning_rate': 9.21e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:08,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:08,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:08,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:08,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1649, 'learning_rate': 9.22e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:08,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:22,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:22,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1081, 'learning_rate': 9.230000000000001e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:22,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:28,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:28,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1439, 'learning_rate': 9.240000000000001e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:32,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 928/17840 [1:34:18<29:01:37, 6.18s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 928/17840 [1:34:18<29:01:37, 6.18s/it]g-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:36,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:36,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:36,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:13:52,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 929/17840 [1:34:24<28:13:08, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 929/17840 [1:34:24<28:13:08, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:45,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:45,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2395, 'learning_rate': 9.27e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:49,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:49,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 931/17840 [1:34:34<26:42:12, 5.69s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:52,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:55,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:55,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9298, 'learning_rate': 9.290000000000001e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:59,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:15:59,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 933/17840 [1:34:45<25:11:17, 5.36s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:02,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:05,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:05,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:07,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:09,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:09,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:11,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:13,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:13,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:15,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:17,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:17,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:19,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:20,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:20,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:23,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:23,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:25,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:25,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:27,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:30,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:30,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:30,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:30,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5384, 'learning_rate': 9.39e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:35,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:35,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:35,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:38,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:38,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:42,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:42,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:42,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:35:30<24:57:03, 5.32s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:35:30<24:57:03, 5.32s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:35:30<24:57:03, 5.32s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:53,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:53,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2995, 'learning_rate': 9.42e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:53,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:53,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:16:53,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:35:45<29:51:27, 6.36s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:35:45<29:51:27, 6.36s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:35:45<29:51:27, 6.36s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:35:45<29:51:27, 6.36s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:35:45<29:51:27, 6.36s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:35:53<31:16:29, 6.66s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:12,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:12,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:36:00<32:19:13, 6.89s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:36:00<32:19:13, 6.89s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3144, 'learning_rate': 9.449999999999999e-05, 'epoch': 1.06} + 5%|███▉ | 948/17840 [1:36:00<32:19:13, 6.89s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:36:00<32:19:13, 6.89s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:36:00<32:19:13, 6.89s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 949/17840 [1:36:07<32:52:24, 7.01s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 949/17840 [1:36:07<32:52:24, 7.01s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:28,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:36:17<36:37:56, 7.81s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:36:17<36:37:56, 7.81s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1192, 'learning_rate': 9.47e-05, 'epoch': 1.07} + 5%|███▉ | 950/17840 [1:36:17<36:37:56, 7.81s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:36:17<36:37:56, 7.81s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 951/17840 [1:36:24<35:48:32, 7.63s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 951/17840 [1:36:24<35:48:32, 7.63s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0104, 'learning_rate': 9.48e-05, 'epoch': 1.07} + 5%|███▉ | 951/17840 [1:36:24<35:48:32, 7.63s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:47,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:47,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5124, 'learning_rate': 9.49e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:47,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:17:47,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:36:38<34:35:47, 7.38s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:36:38<34:35:47, 7.38s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2117, 'learning_rate': 9.5e-05, 'epoch': 1.07} + 5%|███▉ | 953/17840 [1:36:38<34:35:47, 7.38s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:01,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:01,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1834, 'learning_rate': 9.51e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:01,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:01,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:36:52<33:40:52, 7.18s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:36:52<33:40:52, 7.18s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3039, 'learning_rate': 9.52e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:13,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:36:59<33:20:22, 7.11s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:36:59<33:20:22, 7.11s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3042, 'learning_rate': 9.53e-05, 'epoch': 1.07} + 5%|███▉ | 956/17840 [1:36:59<33:20:22, 7.11s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:36:59<33:20:22, 7.11s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:36:59<33:20:22, 7.11s/it]g-point operations will not be computed-17 18:15:41,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:37:06<32:58:32, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:37:06<32:58:32, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:37:06<32:58:32, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 958/17840 [1:37:13<32:39:14, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 958/17840 [1:37:13<32:39:14, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:32,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:32,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:37:20<32:22:41, 6.90s/it]g-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:37:20<32:22:41, 6.90s/it]g-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4786, 'learning_rate': 9.56e-05, 'epoch': 1.08} + 5%|███▉ | 959/17840 [1:37:20<32:22:41, 6.90s/it]g-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:42,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:42,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0121, 'learning_rate': 9.57e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:42,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:42,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:37:33<32:03:42, 6.84s/it]g-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:37:33<32:03:42, 6.84s/it]g-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:52,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:18:52,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:37:40<31:46:56, 6.78s/it]g-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:37:40<31:46:56, 6.78s/it]g-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0906, 'learning_rate': 9.59e-05, 'epoch': 1.08} + 5%|███▉ | 962/17840 [1:37:40<31:46:56, 6.78s/it]g-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:02,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:02,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2468, 'learning_rate': 9.6e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:02,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:09,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:09,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4224, 'learning_rate': 9.61e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:09,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:09,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:18:24,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 965/17840 [1:38:00<31:05:08, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 965/17840 [1:38:00<31:05:08, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9304, 'learning_rate': 9.620000000000001e-05, 'epoch': 1.08} + 5%|████ | 965/17840 [1:38:00<31:05:08, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 965/17840 [1:38:00<31:05:08, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 966/17840 [1:38:06<30:52:32, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:25,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:25,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:38:13<30:42:38, 6.55s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:38:13<30:42:38, 6.55s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2059, 'learning_rate': 9.64e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:33,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:33,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 968/17840 [1:38:19<30:24:06, 6.49s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 968/17840 [1:38:19<30:24:06, 6.49s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:39,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:39,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 969/17840 [1:38:25<30:09:56, 6.44s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 969/17840 [1:38:25<30:09:56, 6.44s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 969/17840 [1:38:25<30:09:56, 6.44s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 969/17840 [1:38:25<30:09:56, 6.44s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:47,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:47,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:47,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:53,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:53,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2765, 'learning_rate': 9.680000000000001e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:53,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:53,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:59,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:59,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:59,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:19:59,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:06,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:06,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:06,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:06,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:12,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:12,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:12,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:12,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:12,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:39:04<31:53:15, 6.81s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:39:04<31:53:15, 6.81s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:39:04<31:53:15, 6.81s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:39:04<31:53:15, 6.81s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:26,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:30,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:30,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 977/17840 [1:39:16<29:30:24, 6.30s/it]g-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:34,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:34,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:34,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:19:17,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:39:22<28:37:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:39:22<28:37:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:43,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:43,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0044, 'learning_rate': 9.76e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:47,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:47,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 980/17840 [1:39:32<26:50:56, 5.73s/it]g-point operations will not be computed-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:51,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:51,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:51,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:39,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 981/17840 [1:39:38<25:58:15, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:57,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:20:57,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 982/17840 [1:39:43<25:13:13, 5.39s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:00,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:03,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:03,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:05,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:07,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:07,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:09,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:11,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:11,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:13,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:15,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:15,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:17,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:17,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:18,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:21,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:21,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:23,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:23,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:25,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:25,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:27,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:29,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:29,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:31,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:31,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0894, 'learning_rate': 9.89e-05, 'epoch': 1.11} +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:35,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:35,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:35,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:38,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:38,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:42,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:42,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:42,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:46,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:46,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:46,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:46,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:46,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 995/17840 [1:40:38<27:42:32, 5.92s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:57,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:57,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:21:57,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:40:46<29:43:42, 6.35s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:40:46<29:43:42, 6.35s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:40:46<29:43:42, 6.35s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:40:46<29:43:42, 6.35s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:40:46<29:43:42, 6.35s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:40:53<31:07:44, 6.65s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:40:53<31:07:44, 6.65s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:40:53<31:07:44, 6.65s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:16,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:16,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4368, 'learning_rate': 9.95e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:16,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:16,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:16,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:41:07<32:27:31, 6.94s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:41:07<32:27:31, 6.94s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:28,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:28,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1000/17840 [1:41:17<36:14:17, 7.75s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1000/17840 [1:41:17<36:14:17, 7.75s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:38,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:41:24<35:34:35, 7.61s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:41:24<35:34:35, 7.61s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3951, 'learning_rate': 9.98e-05, 'epoch': 1.12} + 6%|████ | 1001/17840 [1:41:24<35:34:35, 7.61s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:41:24<35:34:35, 7.61s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:41:24<35:34:35, 7.61s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:41:31<34:42:24, 7.42s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:50,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:22:50,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:41:38<34:07:57, 7.30s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:41:38<34:07:57, 7.30s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1558, 'learning_rate': 0.0001, 'epoch': 1.12} + 6%|████ | 1003/17840 [1:41:38<34:07:57, 7.30s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:41:38<34:07:57, 7.30s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:41:38<34:07:57, 7.30s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1004/17840 [1:41:45<33:40:55, 7.20s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:04,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:04,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:04,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:41:52<33:24:20, 7.14s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:41:52<33:24:20, 7.14s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:13,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:41:59<33:10:11, 7.09s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:41:59<33:10:11, 7.09s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.174, 'learning_rate': 9.998218527315915e-05, 'epoch': 1.13} + 6%|████ | 1006/17840 [1:41:59<33:10:11, 7.09s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:41:59<33:10:11, 7.09s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:41:59<33:10:11, 7.09s/it]g-point operations will not be computed-17 18:20:54,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:42:06<32:50:59, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:27,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:27,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:42:13<32:32:21, 6.96s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:42:13<32:32:21, 6.96s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:42:13<32:32:21, 6.96s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:35,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:35,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1418, 'learning_rate': 9.99643705463183e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:35,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:35,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:35,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1010/17840 [1:42:26<32:05:13, 6.86s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:45,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:45,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:42:33<31:55:46, 6.83s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:42:33<31:55:46, 6.83s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1272, 'learning_rate': 9.995249406175773e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-17 18:23:54,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:42:40<31:48:18, 6.80s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:42:40<31:48:18, 6.80s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9955, 'learning_rate': 9.994655581947743e-05, 'epoch': 1.13} + 6%|████▏ | 1012/17840 [1:42:40<31:48:18, 6.80s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:42:40<31:48:18, 6.80s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:42:40<31:48:18, 6.80s/it]g-point operations will not be computed-17 18:23:23,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:42:46<31:26:56, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:42:46<31:26:56, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:42:46<31:26:56, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:42:46<31:26:56, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:42:53<31:18:47, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:12,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:12,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1015/17840 [1:43:00<31:03:45, 6.65s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1015/17840 [1:43:00<31:03:45, 6.65s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9606, 'learning_rate': 9.992874109263658e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:20,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:43:06<30:57:07, 6.62s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:43:06<30:57:07, 6.62s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1703, 'learning_rate': 9.99228028503563e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8666, 'learning_rate': 9.991686460807601e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:26,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:35,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:35,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1392, 'learning_rate': 9.991092636579573e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:35,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:35,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:43:26<30:27:41, 6.52s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:43:26<30:27:41, 6.52s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:44,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:44,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:43:32<30:12:06, 6.46s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:43:32<30:12:06, 6.46s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:51,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:51,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1021/17840 [1:43:38<29:58:11, 6.41s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1021/17840 [1:43:38<29:58:11, 6.41s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:57,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:24:57,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1022/17840 [1:43:44<29:45:29, 6.37s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1022/17840 [1:43:44<29:45:29, 6.37s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:03,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:03,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1023/17840 [1:43:51<29:35:12, 6.33s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1023/17840 [1:43:51<29:35:12, 6.33s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:09,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:09,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1024/17840 [1:43:57<29:17:48, 6.27s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1024/17840 [1:43:57<29:17:48, 6.27s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:15,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:15,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:44:05<32:05:32, 6.87s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:44:05<32:05:32, 6.87s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2235, 'learning_rate': 9.986935866983373e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:25,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1026/17840 [1:44:11<30:47:37, 6.59s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1026/17840 [1:44:11<30:47:37, 6.59s/it]g-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:29,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:29,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:24:04,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1027/17840 [1:44:17<29:36:36, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1027/17840 [1:44:17<29:36:36, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.345, 'learning_rate': 9.985748218527317e-05, 'epoch': 1.15} + 6%|████▏ | 1027/17840 [1:44:17<29:36:36, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:38,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:38,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:42,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:42,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1029/17840 [1:44:28<27:52:13, 5.97s/it]g-point operations will not be computed-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:46,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:46,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:46,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:34,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1030/17840 [1:44:33<27:07:02, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:25:50,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1030/17840 [1:44:33<27:07:02, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:25:50,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:54,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:50,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:54,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:50,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1832, 'learning_rate': 9.983372921615203e-05, 'epoch': 1.16} +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:58,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:50,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:25:58,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:25:50,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1032/17840 [1:44:44<25:35:27, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1032/17840 [1:44:44<25:35:27, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1032/17840 [1:44:44<25:35:27, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:04,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:07,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:09,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:09,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:11,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:13,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:13,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:15,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:17,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:17,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:19,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:21,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:21,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:22,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:22,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:24,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:27,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:27,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:29,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:29,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:30,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:30,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:33,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:33,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:34,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:34,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:38,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:41,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:41,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3064, 'learning_rate': 9.97624703087886e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:45,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:45,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:49,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:49,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1285, 'learning_rate': 9.975653206650832e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:49,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:49,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:26:49,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:45:41<27:25:50, 5.88s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:45:41<27:25:50, 5.88s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:45:41<27:25:50, 5.88s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:45:41<27:25:50, 5.88s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:45:41<27:25:50, 5.88s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:45:48<29:35:08, 6.34s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:07,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:07,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:45:56<31:00:39, 6.65s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:45:56<31:00:39, 6.65s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0813, 'learning_rate': 9.973871733966747e-05, 'epoch': 1.17} + 6%|████▎ | 1047/17840 [1:45:56<31:00:39, 6.65s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:45:56<31:00:39, 6.65s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:45:56<31:00:39, 6.65s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1048/17840 [1:46:03<31:51:53, 6.83s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:22,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:22,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:46:10<32:23:21, 6.94s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:46:10<32:23:21, 6.94s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7178, 'learning_rate': 9.97268408551069e-05, 'epoch': 1.18} + 6%|████▎ | 1049/17840 [1:46:10<32:23:21, 6.94s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:46:10<32:23:21, 6.94s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:46:20<36:02:27, 7.73s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:46:20<36:02:27, 7.73s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5737, 'learning_rate': 9.97209026128266e-05, 'epoch': 1.18} + 6%|████▎ | 1050/17840 [1:46:20<36:02:27, 7.73s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:42,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:42,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0987, 'learning_rate': 9.971496437054632e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:42,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:42,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1052/17840 [1:46:34<34:51:06, 7.47s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1052/17840 [1:46:34<34:51:06, 7.47s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3367, 'learning_rate': 9.970902612826603e-05, 'epoch': 1.18} + 6%|████▎ | 1052/17840 [1:46:34<34:51:06, 7.47s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:57,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:57,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1949, 'learning_rate': 9.970308788598575e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:57,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:27:57,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:46:48<33:48:03, 7.25s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:46:48<33:48:03, 7.25s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8049, 'learning_rate': 9.969714964370547e-05, 'epoch': 1.18} + 6%|████▎ | 1054/17840 [1:46:48<33:48:03, 7.25s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:11,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:11,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2465, 'learning_rate': 9.969121140142518e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:11,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:11,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:11,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:47:02<33:02:37, 7.09s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:21,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:21,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:47:09<32:37:49, 7.00s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:47:09<32:37:49, 7.00s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.42, 'learning_rate': 9.96793349168646e-05, 'epoch': 1.18} + 6%|████▎ | 1057/17840 [1:47:09<32:37:49, 7.00s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:31,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:31,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0213, 'learning_rate': 9.967339667458433e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:31,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:31,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1059/17840 [1:47:22<32:04:51, 6.88s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1059/17840 [1:47:22<32:04:51, 6.88s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:41,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:41,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1060/17840 [1:47:29<31:53:46, 6.84s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1060/17840 [1:47:29<31:53:46, 6.84s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2884, 'learning_rate': 9.966152019002377e-05, 'epoch': 1.19} + 6%|████▎ | 1060/17840 [1:47:29<31:53:46, 6.84s/it]g-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:51,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:51,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2611, 'learning_rate': 9.965558194774347e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:51,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:28:51,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:26:01,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:47:43<31:35:10, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:47:43<31:35:10, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6643, 'learning_rate': 9.96496437054632e-05, 'epoch': 1.19} + 6%|████▎ | 1062/17840 [1:47:43<31:35:10, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1063/17840 [1:47:49<31:29:27, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1063/17840 [1:47:49<31:29:27, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:08,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:08,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1064/17840 [1:47:56<31:17:22, 6.71s/it]g-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1064/17840 [1:47:56<31:17:22, 6.71s/it]g-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2878, 'learning_rate': 9.963776722090262e-05, 'epoch': 1.19} + 6%|████▎ | 1064/17840 [1:47:56<31:17:22, 6.71s/it]g-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:18,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:18,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2502, 'learning_rate': 9.963182897862233e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:18,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:18,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:18,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:00,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:48:09<30:54:03, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:48:09<30:54:03, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:48:09<30:54:03, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1067/17840 [1:48:15<30:38:06, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1067/17840 [1:48:15<30:38:06, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:34,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:34,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:48:22<30:18:47, 6.51s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:48:22<30:18:47, 6.51s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:41,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:41,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:48:28<30:14:16, 6.49s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:48:28<30:14:16, 6.49s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3081, 'learning_rate': 9.96080760095012e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:49,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:48:35<30:11:50, 6.48s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:48:35<30:11:50, 6.48s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3346, 'learning_rate': 9.96021377672209e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-17 18:29:55,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1071/17840 [1:48:41<29:52:08, 6.41s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1071/17840 [1:48:41<29:52:08, 6.41s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4364, 'learning_rate': 9.959619952494062e-05, 'epoch': 1.2} + 6%|████▍ | 1071/17840 [1:48:41<29:52:08, 6.41s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1071/17840 [1:48:41<29:52:08, 6.41s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:03,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:03,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:03,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:09,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:09,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1174, 'learning_rate': 9.958432304038005e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:09,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:09,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:15,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:15,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:19,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:19,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1075/17840 [1:49:08<31:51:50, 6.84s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1075/17840 [1:49:08<31:51:50, 6.84s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:28,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:28,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1076/17840 [1:49:14<30:34:12, 6.56s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1076/17840 [1:49:14<30:34:12, 6.56s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:33,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:33,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1077/17840 [1:49:19<29:28:18, 6.33s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:38,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:38,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:38,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1078/17840 [1:49:25<28:35:27, 6.14s/it]g-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:43,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:43,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:43,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:29:26,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1079/17840 [1:49:31<27:45:15, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:48,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1079/17840 [1:49:31<27:45:15, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:48,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1079/17840 [1:49:31<27:45:15, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:48,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:51,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:48,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:54,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:48,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:54,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:48,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:30:54,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:48,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1081/17840 [1:49:41<26:08:03, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1081/17840 [1:49:41<26:08:03, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1081/17840 [1:49:41<26:08:03, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:02,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:04,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:06,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:06,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2573, 'learning_rate': 9.95249406175772e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:10,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:10,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:30:58,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1084/17840 [1:49:55<23:16:28, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:12,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:14,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:12,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:14,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:12,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1085/17840 [1:50:00<22:08:14, 4.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:16,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:18,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:16,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:18,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:16,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1086/17840 [1:50:04<20:57:56, 4.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1087/17840 [1:50:07<19:42:07, 4.23s/it]g-point operations will not be computed-17 18:31:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1087/17840 [1:50:07<19:42:07, 4.23s/it]g-point operations will not be computed-17 18:31:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1087/17840 [1:50:07<19:42:07, 4.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:24,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1087/17840 [1:50:07<19:42:07, 4.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:24,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1088/17840 [1:50:10<18:20:39, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:27,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:28,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:27,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:28,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:27,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1089/17840 [1:50:14<17:12:21, 3.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:30,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1089/17840 [1:50:14<17:12:21, 3.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:30,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1090/17840 [1:50:16<15:52:43, 3.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:32,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1090/17840 [1:50:16<15:52:43, 3.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:32,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1091/17840 [1:50:19<14:27:29, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:35,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:50:21<13:01:06, 2.80s/it]g-point operations will not be computed-17 18:31:35,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:50:21<13:01:06, 2.80s/it]g-point operations will not be computed-17 18:31:35,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:50:21<13:01:06, 2.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:38,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:50:21<13:01:06, 2.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:38,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:42,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:38,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:42,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:38,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:50:29<20:06:22, 4.32s/it]g-point operations will not be computed-17 18:31:38,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:50:29<20:06:22, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:50:29<20:06:22, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:50,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:31:50,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:50:36<24:43:46, 5.32s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:50:36<24:43:46, 5.32s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:50:36<24:43:46, 5.32s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:50:36<24:43:46, 5.32s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:50:36<24:43:46, 5.32s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:50:44<27:40:00, 5.95s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:50:44<27:40:00, 5.95s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:05,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:50:51<29:49:24, 6.41s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:50:51<29:49:24, 6.41s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5259, 'learning_rate': 9.94477434679335e-05, 'epoch': 1.23} + 6%|████▍ | 1096/17840 [1:50:51<29:49:24, 6.41s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:50:51<29:49:24, 6.41s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:50:51<29:49:24, 6.41s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:50:59<31:13:26, 6.71s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:50:59<31:13:26, 6.71s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1097/17840 [1:50:59<31:13:26, 6.71s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:21,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:21,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4222, 'learning_rate': 9.943586698337292e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:21,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:21,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:21,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:51:13<32:29:25, 6.99s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:51:13<32:29:25, 6.99s/it]g-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:34,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:34,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:31:46,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:51:23<36:16:09, 7.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:51:23<36:16:09, 7.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:51:23<36:16:09, 7.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1101/17840 [1:51:30<35:34:00, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1101/17840 [1:51:30<35:34:00, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4343, 'learning_rate': 9.941805225653207e-05, 'epoch': 1.23} + 6%|████▌ | 1101/17840 [1:51:30<35:34:00, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1101/17840 [1:51:30<35:34:00, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1101/17840 [1:51:30<35:34:00, 7.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:51:37<34:56:57, 7.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:56,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:32:56,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1103/17840 [1:51:44<34:17:18, 7.38s/it]g-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1103/17840 [1:51:44<34:17:18, 7.38s/it]g-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0815, 'learning_rate': 9.94061757719715e-05, 'epoch': 1.24} + 6%|████▌ | 1103/17840 [1:51:44<34:17:18, 7.38s/it]g-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:07,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:07,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2368, 'learning_rate': 9.940023752969122e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:07,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:07,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:51:59<33:31:34, 7.21s/it]g-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:51:59<33:31:34, 7.21s/it]g-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2828, 'learning_rate': 9.939429928741093e-05, 'epoch': 1.24} + 6%|████▌ | 1105/17840 [1:51:59<33:31:34, 7.21s/it]g-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:51:59<33:31:34, 7.21s/it]g-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:51:59<33:31:34, 7.21s/it]g-point operations will not be computed-17 18:32:40,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:52:05<33:05:07, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:52:05<33:05:07, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:52:05<33:05:07, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:52:12<32:51:04, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:52:12<32:51:04, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4668, 'learning_rate': 9.938242280285037e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:33,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:52:19<32:34:43, 7.01s/it]g-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:52:19<32:34:43, 7.01s/it]g-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2805, 'learning_rate': 9.937648456057007e-05, 'epoch': 1.24} + 6%|████▌ | 1108/17840 [1:52:19<32:34:43, 7.01s/it]g-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:42,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:42,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2217, 'learning_rate': 9.93705463182898e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:42,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:42,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:52:33<32:10:23, 6.92s/it]g-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:52:33<32:10:23, 6.92s/it]g-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:52,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:33:52,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1111/17840 [1:52:40<31:54:15, 6.87s/it]g-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1111/17840 [1:52:40<31:54:15, 6.87s/it]g-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1554, 'learning_rate': 9.935866983372922e-05, 'epoch': 1.25} + 6%|████▌ | 1111/17840 [1:52:40<31:54:15, 6.87s/it]g-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:02,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:02,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1566, 'learning_rate': 9.935273159144893e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:02,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:02,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:33:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:52:53<31:29:21, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:52:53<31:29:21, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2904, 'learning_rate': 9.934679334916865e-05, 'epoch': 1.25} + 6%|████▌ | 1113/17840 [1:52:53<31:29:21, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1114/17840 [1:53:00<31:20:09, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1114/17840 [1:53:00<31:20:09, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2368, 'learning_rate': 9.934085510688837e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:20,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1115/17840 [1:53:06<31:18:52, 6.74s/it]g-point operations will not be computed-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1115/17840 [1:53:06<31:18:52, 6.74s/it]g-point operations will not be computed-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0622, 'learning_rate': 9.933491686460809e-05, 'epoch': 1.25} + 6%|████▌ | 1115/17840 [1:53:06<31:18:52, 6.74s/it]g-point operations will not be computed-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:29,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:29,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1278, 'learning_rate': 9.93289786223278e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:29,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:29,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:10,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:53:20<30:50:25, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:53:20<30:50:25, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1799, 'learning_rate': 9.932304038004752e-05, 'epoch': 1.25} + 6%|████▌ | 1117/17840 [1:53:20<30:50:25, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:53:26<30:34:41, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:53:26<30:34:41, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5165, 'learning_rate': 9.931710213776722e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:46,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:46,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:53:32<30:17:50, 6.52s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:53:32<30:17:50, 6.52s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:53,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:53,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1120/17840 [1:53:39<30:05:23, 6.48s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1120/17840 [1:53:39<30:05:23, 6.48s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:59,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:34:59,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:53:45<29:56:06, 6.45s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:53:45<29:56:06, 6.45s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:05,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1122/17840 [1:53:51<29:38:18, 6.38s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1122/17840 [1:53:51<29:38:18, 6.38s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1778, 'learning_rate': 9.929334916864609e-05, 'epoch': 1.26} + 6%|████▌ | 1122/17840 [1:53:51<29:38:18, 6.38s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1122/17840 [1:53:51<29:38:18, 6.38s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:13,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:13,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:13,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:13,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:19,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:54:12<31:51:54, 6.86s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:54:12<31:51:54, 6.86s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4404, 'learning_rate': 9.927553444180522e-05, 'epoch': 1.26} + 6%|████▌ | 1125/17840 [1:54:12<31:51:54, 6.86s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:54:12<31:51:54, 6.86s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:33,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:33,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:38,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:38,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1127/17840 [1:54:24<29:21:15, 6.32s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1127/17840 [1:54:24<29:21:15, 6.32s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:43,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:43,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1128/17840 [1:54:29<28:24:47, 6.12s/it]g-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:48,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:48,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:48,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:34:37,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:54:35<27:41:00, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:54:35<27:41:00, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:54:35<27:41:00, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:56,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:35:56,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:00,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1131/17840 [1:54:45<26:05:02, 5.62s/it]g-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:03,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:06,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:06,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1902, 'learning_rate': 9.923396674584323e-05, 'epoch': 1.27} +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:09,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:09,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:35:52,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1133/17840 [1:54:55<24:08:59, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:12,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:14,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:12,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:14,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:12,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1134/17840 [1:55:00<23:02:50, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:16,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:16,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:18,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:16,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1135/17840 [1:55:04<21:45:16, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:20,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:22,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:20,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:22,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:20,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1136/17840 [1:55:07<20:29:34, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:24,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1136/17840 [1:55:07<20:29:34, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:24,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1137/17840 [1:55:11<19:05:11, 4.11s/it]g-point operations will not be computed-17 18:36:24,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1137/17840 [1:55:11<19:05:11, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:27,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1137/17840 [1:55:11<19:05:11, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:27,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1138/17840 [1:55:14<17:40:24, 3.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:30,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1138/17840 [1:55:14<17:40:24, 3.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:30,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1139/17840 [1:55:17<16:14:46, 3.50s/it]g-point operations will not be computed-17 18:36:30,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:34,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:33,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:34,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:33,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:36,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:35,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:36,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:35,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:39,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:38,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:39,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:38,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:55:24<12:29:58, 2.69s/it]g-point operations will not be computed-17 18:36:38,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:55:24<12:29:58, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:41,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:55:24<12:29:58, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:41,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:45,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:41,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:45,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:41,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:55:31<19:29:02, 4.20s/it]g-point operations will not be computed-17 18:36:41,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:55:31<19:29:02, 4.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:49,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:52,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:49,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:36:52,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:36:49,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:55:39<23:59:08, 5.17s/it]g-point operations will not be computed-17 18:36:49,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:55:39<23:59:08, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:55:39<23:59:08, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:55:39<23:59:08, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:55:39<23:59:08, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:55:46<27:09:40, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:55:46<27:09:40, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:55:46<27:09:40, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:55:46<27:09:40, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:55:46<27:09:40, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:36:56,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:55:54<29:13:44, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:55:54<29:13:44, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:55:54<29:13:44, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:55:54<29:13:44, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:56:01<30:34:18, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:56:01<30:34:18, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:56:01<30:34:18, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:56:01<30:34:18, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:56:01<30:34:18, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:11,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:08<31:27:27, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:08<31:27:27, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:08<31:27:27, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:56:08<31:27:27, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:56:15<32:00:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|███��▋ | 1149/17840 [1:56:15<32:00:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:56:15<32:00:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:56:15<32:00:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:56:15<32:00:23, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:56:25<35:49:13, 7.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:56:25<35:49:13, 7.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:37:46,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:56:32<35:05:27, 7.57s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:56:32<35:05:27, 7.57s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4716, 'learning_rate': 9.912114014251782e-05, 'epoch': 1.29} + 6%|████▋ | 1151/17840 [1:56:32<35:05:27, 7.57s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:56:32<35:05:27, 7.57s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:56:32<35:05:27, 7.57s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:56:39<34:28:12, 7.44s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:56:39<34:28:12, 7.44s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:56:39<34:28:12, 7.44s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:56:39<34:28:12, 7.44s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:02,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:02,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:02,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:02,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:02,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1154/17840 [1:56:53<33:29:46, 7.23s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:12,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:12,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:57:00<33:18:07, 7.19s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:57:00<33:18:07, 7.19s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4021, 'learning_rate': 9.909738717339669e-05, 'epoch': 1.29} + 6%|████▋ | 1155/17840 [1:57:00<33:18:07, 7.19s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:23,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:23,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.969, 'learning_rate': 9.909144893111639e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:23,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:23,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:23,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1157/17840 [1:57:14<32:30:41, 7.02s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:33,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:33,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:57:21<32:12:25, 6.95s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:57:21<32:12:25, 6.95s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3404, 'learning_rate': 9.907957244655582e-05, 'epoch': 1.3} + 6%|████▋ | 1158/17840 [1:57:21<32:12:25, 6.95s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:57:21<32:12:25, 6.95s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:57:21<32:12:25, 6.95s/it]g-point operations will not be computed-17 18:37:25,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:57:28<32:01:08, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:57:28<32:01:08, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:57:28<32:01:08, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:57:28<32:01:08, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▋ | 1160/17840 [1:57:34<31:49:42, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:53,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:38:53,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1161/17840 [1:57:41<31:31:26, 6.80s/it]g-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1161/17840 [1:57:41<31:31:26, 6.80s/it]g-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1172, 'learning_rate': 9.906175771971497e-05, 'epoch': 1.3} + 7%|████▊ | 1161/17840 [1:57:41<31:31:26, 6.80s/it]g-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0968, 'learning_rate': 9.905581947743469e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:03,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:38:45,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:57:54<31:12:43, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:57:54<31:12:43, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:57:54<31:12:43, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:57:54<31:12:43, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1164/17840 [1:58:01<31:08:34, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:20,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:20,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1165/17840 [1:58:08<30:50:09, 6.66s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1165/17840 [1:58:08<30:50:09, 6.66s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6928, 'learning_rate': 9.903800475059382e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:28,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:58:14<30:33:55, 6.60s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:58:14<30:33:55, 6.60s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0706, 'learning_rate': 9.903206650831354e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:34,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:58:21<30:20:45, 6.55s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:58:21<30:20:45, 6.55s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2401, 'learning_rate': 9.902612826603326e-05, 'epoch': 1.31} + 7%|████▊ | 1167/17840 [1:58:21<30:20:45, 6.55s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:58:21<30:20:45, 6.55s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:58:21<30:20:45, 6.55s/it]g-point operations will not be computed-17 18:39:12,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:58:27<30:08:25, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:58:27<30:08:25, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:58:27<30:08:25, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:58:27<30:08:25, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1169/17840 [1:58:33<30:04:35, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:52,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:52,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:52,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:58:40<29:38:54, 6.40s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:58,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:58,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:39:58,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:58:46<29:26:40, 6.36s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:05,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:05,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:58:52<29:23:50, 6.35s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:58:52<29:23:50, 6.35s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5761, 'learning_rate': 9.899643705463182e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:12,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1173/17840 [1:58:58<29:07:37, 6.29s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1173/17840 [1:58:58<29:07:37, 6.29s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:17,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:17,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1174/17840 [1:59:04<28:44:59, 6.21s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1174/17840 [1:59:04<28:44:59, 6.21s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:23,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:23,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:59:13<31:39:37, 6.84s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:59:13<31:39:37, 6.84s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:31,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:31,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1176/17840 [1:59:19<30:28:26, 6.58s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1176/17840 [1:59:19<30:28:26, 6.58s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2875, 'learning_rate': 9.897268408551069e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:38,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1177/17840 [1:59:24<29:21:30, 6.34s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1177/17840 [1:59:24<29:21:30, 6.34s/it]g-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:43,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:43,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:43,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:39:44,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1178/17840 [1:59:30<28:26:24, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1178/17840 [1:59:30<28:26:24, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:51,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:51,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.274, 'learning_rate': 9.895486935866984e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:55,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1180/17840 [1:59:41<26:51:40, 5.80s/it]g-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1180/17840 [1:59:41<26:51:40, 5.80s/it]g-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:40:59,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:02,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:02,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.006, 'learning_rate': 9.894299287410927e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:05,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:05,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:40:47,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1182/17840 [1:59:51<24:59:41, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1182/17840 [1:59:51<24:59:41, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1182/17840 [1:59:51<24:59:41, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:11,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:14,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:14,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:16,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:18,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:18,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:20,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:22,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:22,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:24,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:25,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:25,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:27,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:30,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:30,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:32,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:32,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:34,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:34,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:36,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:36,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:38,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:38,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:40,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:40,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:44,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:44,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:44,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:48,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:48,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:52,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:52,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:52,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:55,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:55,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:55,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:55,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:41:55,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:41:08,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1195/17840 [2:00:47<27:28:32, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:08,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:08,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:00:55<29:27:59, 6.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:00:55<29:27:59, 6.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:00:55<29:27:59, 6.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:00:55<29:27:59, 6.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1196/17840 [2:00:55<29:27:59, 6.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1197/17840 [2:01:02<30:43:30, 6.65s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1197/17840 [2:01:02<30:43:30, 6.65s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1197/17840 [2:01:02<30:43:30, 6.65s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3885, 'learning_rate': 9.884204275534442e-05, 'epoch': 1.34} +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [2:01:17<32:14:14, 6.97s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [2:01:17<32:14:14, 6.97s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [2:01:17<32:14:14, 6.97s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [2:01:17<32:14:14, 6.97s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [2:01:17<32:14:14, 6.97s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [2:01:26<35:55:46, 7.77s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [2:01:26<35:55:46, 7.77s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:42:47,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:01:34<35:18:09, 7.64s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:01:34<35:18:09, 7.64s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0712, 'learning_rate': 9.882422802850356e-05, 'epoch': 1.35} + 7%|████▉ | 1201/17840 [2:01:34<35:18:09, 7.64s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:01:34<35:18:09, 7.64s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [2:01:34<35:18:09, 7.64s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1202/17840 [2:01:41<34:36:42, 7.49s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1202/17840 [2:01:41<34:36:42, 7.49s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:02,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [2:01:48<34:02:24, 7.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [2:01:48<34:02:24, 7.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1059, 'learning_rate': 9.881235154394299e-05, 'epoch': 1.35} + 7%|████▉ | 1203/17840 [2:01:48<34:02:24, 7.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [2:01:48<34:02:24, 7.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [2:01:48<34:02:24, 7.37s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [2:01:55<33:37:57, 7.28s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:14,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:14,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1205/17840 [2:02:02<33:10:05, 7.18s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1205/17840 [2:02:02<33:10:05, 7.18s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0692, 'learning_rate': 9.880047505938242e-05, 'epoch': 1.35} + 7%|████▉ | 1205/17840 [2:02:02<33:10:05, 7.18s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1205/17840 [2:02:02<33:10:05, 7.18s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1205/17840 [2:02:02<33:10:05, 7.18s/it]g-point operations will not be computed-17 18:42:05,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [2:02:09<32:52:11, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [2:02:09<32:52:11, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [2:02:09<32:52:11, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [2:02:09<32:52:11, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [2:02:16<32:29:12, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [2:02:16<32:29:12, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:36,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1208/17840 [2:02:23<32:14:35, 6.98s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1208/17840 [2:02:23<32:14:35, 6.98s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4814, 'learning_rate': 9.878266033254158e-05, 'epoch': 1.35} + 7%|████▉ | 1208/17840 [2:02:23<32:14:35, 6.98s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:45,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:45,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.272, 'learning_rate': 9.877672209026129e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:45,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:45,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [2:02:36<31:53:19, 6.90s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [2:02:36<31:53:19, 6.90s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:55,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:43:55,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [2:02:43<31:32:01, 6.83s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [2:02:43<31:32:01, 6.83s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3593, 'learning_rate': 9.876484560570071e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:03,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [2:02:50<31:27:17, 6.81s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [2:02:50<31:27:17, 6.81s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1644, 'learning_rate': 9.875890736342042e-05, 'epoch': 1.36} + 7%|████▉ | 1212/17840 [2:02:50<31:27:17, 6.81s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [2:02:50<31:27:17, 6.81s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [2:02:50<31:27:17, 6.81s/it]g-point operations will not be computed-17 18:43:26,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1213/17840 [2:02:56<31:24:33, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1213/17840 [2:02:56<31:24:33, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1213/17840 [2:02:56<31:24:33, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1214/17840 [2:03:03<31:08:32, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1214/17840 [2:03:03<31:08:32, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2118, 'learning_rate': 9.874703087885986e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:23,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [2:03:10<30:55:12, 6.70s/it]g-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [2:03:10<30:55:12, 6.70s/it]g-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2686, 'learning_rate': 9.874109263657958e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:30,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:30,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:30,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1294, 'learning_rate': 9.873515439429929e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:30,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:30,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:30,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:14,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [2:03:23<30:38:22, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [2:03:23<30:38:22, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [2:03:23<30:38:22, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1218/17840 [2:03:29<30:22:56, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1218/17840 [2:03:29<30:22:56, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:48,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:48,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [2:03:36<30:07:24, 6.52s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [2:03:36<30:07:24, 6.52s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:54,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:44:54,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [2:03:42<29:52:20, 6.47s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [2:03:42<29:52:20, 6.47s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:01,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:01,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [2:03:48<29:39:41, 6.43s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [2:03:48<29:39:41, 6.43s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2594, 'learning_rate': 9.870546318289786e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:08,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [2:03:55<29:26:25, 6.38s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [2:03:55<29:26:25, 6.38s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5888, 'learning_rate': 9.869952494061758e-05, 'epoch': 1.37} + 7%|█████ | 1222/17840 [2:03:55<29:26:25, 6.38s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:16,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:16,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0266, 'learning_rate': 9.869358669833729e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:21,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [2:04:07<29:02:06, 6.29s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [2:04:07<29:02:06, 6.29s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1454, 'learning_rate': 9.868764845605701e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:27,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [2:04:15<31:54:14, 6.91s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [2:04:15<31:54:14, 6.91s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6756, 'learning_rate': 9.868171021377672e-05, 'epoch': 1.37} + 7%|█████ | 1225/17840 [2:04:15<31:54:14, 6.91s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:37,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:37,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4165, 'learning_rate': 9.867577197149644e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:41,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1227/17840 [2:04:27<29:28:02, 6.39s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1227/17840 [2:04:27<29:28:02, 6.39s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1887, 'learning_rate': 9.866983372921616e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:47,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:47,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1228/17840 [2:04:33<28:31:12, 6.18s/it]g-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:51,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:51,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:51,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:44:40,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1229/17840 [2:04:38<27:45:41, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:45:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1229/17840 [2:04:38<27:45:41, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:45:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1229/17840 [2:04:38<27:45:41, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:45:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:59,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:45:59,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:03,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:03,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:45:55,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1231/17840 [2:04:49<26:17:09, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:46:06,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1231/17840 [2:04:49<26:17:09, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:46:06,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:10,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:06,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:10,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:06,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1811, 'learning_rate': 9.864014251781473e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:14,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:06,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:14,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:06,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1233/17840 [2:04:59<24:41:04, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:18,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:18,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1234/17840 [2:05:04<23:39:12, 5.13s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:22,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:22,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:24,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:26,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:26,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:28,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:30,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:30,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:31,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:33,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:33,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:36,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:36,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:38,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:39,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:39,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:42,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:42,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:44,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:44,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:45,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:45,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:49,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:49,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:49,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:53,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:53,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:46:57,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:00,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:00,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4262, 'learning_rate': 9.856888361045131e-05, 'epoch': 1.39} +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:00,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:00,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:00,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1245/17840 [2:05:52<27:19:27, 5.93s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1245/17840 [2:05:52<27:19:27, 5.93s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1245/17840 [2:05:52<27:19:27, 5.93s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1245/17840 [2:05:52<27:19:27, 5.93s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1245/17840 [2:05:52<27:19:27, 5.93s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:06:00<29:11:36, 6.33s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:19,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:19,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:06:07<30:31:24, 6.62s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:06:07<30:31:24, 6.62s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5314, 'learning_rate': 9.855106888361046e-05, 'epoch': 1.4} + 7%|█████ | 1247/17840 [2:06:07<30:31:24, 6.62s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:06:07<30:31:24, 6.62s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [2:06:07<30:31:24, 6.62s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:06:14<31:29:46, 6.83s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:06:14<31:29:46, 6.83s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:35,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:06:21<32:01:16, 6.95s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:06:21<32:01:16, 6.95s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2769, 'learning_rate': 9.853919239904988e-05, 'epoch': 1.4} + 7%|█████ | 1249/17840 [2:06:21<32:01:16, 6.95s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:06:21<32:01:16, 6.95s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:06:21<32:01:16, 6.95s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:06:31<35:41:41, 7.75s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:06:31<35:41:41, 7.75s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:06:31<35:41:41, 7.75s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:06:31<35:41:41, 7.75s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:06:31<35:41:41, 7.75s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:06:38<35:03:01, 7.61s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:57,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:47:57,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:06:45<34:21:41, 7.46s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:06:45<34:21:41, 7.46s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1236, 'learning_rate': 9.852137767220903e-05, 'epoch': 1.4} + 7%|█████ | 1252/17840 [2:06:45<34:21:41, 7.46s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:08,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:08,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2492, 'learning_rate': 9.851543942992875e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:08,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:08,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:07:00<33:23:12, 7.25s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:07:00<33:23:12, 7.25s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2427, 'learning_rate': 9.850950118764846e-05, 'epoch': 1.41} + 7%|█████▏ | 1254/17840 [2:07:00<33:23:12, 7.25s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:22,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:22,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8141, 'learning_rate': 9.850356294536818e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:22,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:22,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:22,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1256/17840 [2:07:14<32:50:28, 7.13s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:33,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:33,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [2:07:20<32:36:27, 7.08s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [2:07:20<32:36:27, 7.08s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1103, 'learning_rate': 9.84916864608076e-05, 'epoch': 1.41} + 7%|█████▏ | 1257/17840 [2:07:20<32:36:27, 7.08s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [2:07:20<32:36:27, 7.08s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [2:07:20<32:36:27, 7.08s/it]g-point operations will not be computed-17 18:46:16,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [2:07:27<32:16:19, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [2:07:27<32:16:19, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [2:07:27<32:16:19, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:07:34<32:06:23, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:07:34<32:06:23, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1541, 'learning_rate': 9.847980997624703e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-17 18:48:55,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [2:07:41<31:54:37, 6.93s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [2:07:41<31:54:37, 6.93s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3825, 'learning_rate': 9.847387173396675e-05, 'epoch': 1.41} + 7%|█████▏ | 1260/17840 [2:07:41<31:54:37, 6.93s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:03,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:03,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4763, 'learning_rate': 9.846793349168647e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:03,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:03,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:07:55<31:29:09, 6.84s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:07:55<31:29:09, 6.84s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4413, 'learning_rate': 9.846199524940618e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:15,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [2:08:01<31:18:09, 6.80s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [2:08:01<31:18:09, 6.80s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0747, 'learning_rate': 9.845605700712589e-05, 'epoch': 1.42} + 7%|█████▏ | 1263/17840 [2:08:01<31:18:09, 6.80s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:23,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:23,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9797, 'learning_rate': 9.845011876484561e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:23,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:23,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:23,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [2:08:14<30:46:59, 6.69s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:33,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:33,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1266/17840 [2:08:21<30:38:15, 6.65s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1266/17840 [2:08:21<30:38:15, 6.65s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3411, 'learning_rate': 9.843824228028504e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:41,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1267/17840 [2:08:28<30:26:09, 6.61s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1267/17840 [2:08:28<30:26:09, 6.61s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0761, 'learning_rate': 9.843230403800476e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:48,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [2:08:34<30:10:38, 6.56s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [2:08:34<30:10:38, 6.56s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2647, 'learning_rate': 9.842636579572448e-05, 'epoch': 1.42} + 7%|█████▏ | 1268/17840 [2:08:34<30:10:38, 6.56s/it]g-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:56,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:56,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2515, 'learning_rate': 9.842042755344418e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:56,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:56,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:49:56,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:48:45,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1270/17840 [2:08:47<29:42:50, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:04,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1270/17840 [2:08:47<29:42:50, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:04,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1270/17840 [2:08:47<29:42:50, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:04,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1270/17840 [2:08:47<29:42:50, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:04,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1271/17840 [2:08:53<29:29:40, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:10,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1271/17840 [2:08:53<29:29:40, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:10,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1271/17840 [2:08:53<29:29:40, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:10,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1271/17840 [2:08:53<29:29:40, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:10,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1272/17840 [2:08:59<29:10:18, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:16,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1272/17840 [2:08:59<29:10:18, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:16,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1272/17840 [2:08:59<29:10:18, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:16,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1272/17840 [2:08:59<29:10:18, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:16,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1273/17840 [2:09:05<28:58:20, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:22,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1273/17840 [2:09:05<28:58:20, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:22,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1273/17840 [2:09:05<28:58:20, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:22,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1273/17840 [2:09:05<28:58:20, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:22,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [2:09:12<28:48:14, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:29,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [2:09:12<28:48:14, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:29,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [2:09:12<28:48:14, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:29,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████��▏ | 1274/17840 [2:09:12<28:48:14, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:29,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1275/17840 [2:09:20<31:32:55, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:29,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:38,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:29,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:38,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:29,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:38,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:29,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1276/17840 [2:09:26<30:23:59, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1276/17840 [2:09:26<30:23:59, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:47,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:47,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5864, 'learning_rate': 9.83729216152019e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:47,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:53,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:53,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3565, 'learning_rate': 9.836698337292161e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-17 18:50:57,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1279/17840 [2:09:43<27:30:38, 5.98s/it]g-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1279/17840 [2:09:43<27:30:38, 5.98s/it]g-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:01,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:04,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:04,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:04,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:08,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1281/17840 [2:09:53<25:55:36, 5.64s/it]g-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1281/17840 [2:09:53<25:55:36, 5.64s/it]g-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:12,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:12,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:50:43,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1282/17840 [2:09:59<25:16:34, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:15,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1282/17840 [2:09:59<25:16:34, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:15,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:18,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:15,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1283/17840 [2:10:04<24:33:01, 5.34s/it]g-point operations will not be computed-17 18:51:15,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1283/17840 [2:10:04<24:33:01, 5.34s/it]g-point operations will not be computed-17 18:51:15,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:22,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:15,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:22,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:15,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:22,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:15,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1284/17840 [2:10:08<23:39:36, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1285/17840 [2:10:13<22:34:58, 4.91s/it]g-point operations will not be computed-17 18:51:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1285/17840 [2:10:13<22:34:58, 4.91s/it]g-point operations will not be computed-17 18:51:25,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1285/17840 [2:10:13<22:34:58, 4.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:29,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1286/17840 [2:10:17<21:21:06, 4.64s/it]g-point operations will not be computed-17 18:51:29,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1286/17840 [2:10:17<21:21:06, 4.64s/it]g-point operations will not be computed-17 18:51:29,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1286/17840 [2:10:17<21:21:06, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:33,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1286/17840 [2:10:17<21:21:06, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:33,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1287/17840 [2:10:20<19:55:06, 4.33s/it]g-point operations will not be computed-17 18:51:33,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1287/17840 [2:10:20<19:55:06, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:37,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1287/17840 [2:10:20<19:55:06, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:37,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1288/17840 [2:10:24<18:33:39, 4.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:40,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:41,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:40,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:41,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:40,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1289/17840 [2:10:27<17:12:35, 3.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:43,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1289/17840 [2:10:27<17:12:35, 3.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:43,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1290/17840 [2:10:29<15:51:30, 3.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:46,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1290/17840 [2:10:29<15:51:30, 3.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:46,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1291/17840 [2:10:32<14:28:15, 3.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:48,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1291/17840 [2:10:32<14:28:15, 3.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:48,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1292/17840 [2:10:34<13:01:18, 2.83s/it]g-point operations will not be computed-17 18:51:48,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1292/17840 [2:10:34<13:01:18, 2.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:52,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1292/17840 [2:10:34<13:01:18, 2.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:52,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:55,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:52,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:51:55,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:52,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [2:10:42<19:49:00, 4.31s/it]g-point operations will not be computed-17 18:51:52,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [2:10:42<19:49:00, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [2:10:42<19:49:00, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:03,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:03,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:10:49<24:14:21, 5.27s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:10:49<24:14:21, 5.27s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:10:49<24:14:21, 5.27s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:12,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:12,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.288, 'learning_rate': 9.826603325415678e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:12,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:12,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:12,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:04<29:13:52, 6.36s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:04<29:13:52, 6.36s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:04<29:13:52, 6.36s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:04<29:13:52, 6.36s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:11:04<29:13:52, 6.36s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1297/17840 [2:11:11<30:37:56, 6.67s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:31,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:31,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:31,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:19<31:29:39, 6.85s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:19<31:29:39, 6.85s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:19<31:29:39, 6.85s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:19<31:29:39, 6.85s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:11:19<31:29:39, 6.85s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1299/17840 [2:11:26<31:53:14, 6.94s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1299/17840 [2:11:26<31:53:14, 6.94s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:52:47,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:11:35<35:27:00, 7.72s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:11:35<35:27:00, 7.72s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2686, 'learning_rate': 9.823634204275535e-05, 'epoch': 1.46} + 7%|█████▎ | 1300/17840 [2:11:35<35:27:00, 7.72s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:11:35<35:27:00, 7.72s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:11:35<35:27:00, 7.72s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:11:43<34:54:34, 7.60s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:11:43<34:54:34, 7.60s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:11:43<34:54:34, 7.60s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:05,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:05,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3299, 'learning_rate': 9.822446555819478e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:05,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:05,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:05,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [2:11:57<33:42:41, 7.34s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [2:11:57<33:42:41, 7.34s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [2:11:57<33:42:41, 7.34s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:19,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:19,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3081, 'learning_rate': 9.82125890736342e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:19,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:19,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:19,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [2:12:11<32:55:48, 7.17s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [2:12:11<32:55:48, 7.17s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:32,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:12:18<32:43:43, 7.13s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:12:18<32:43:43, 7.13s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1242, 'learning_rate': 9.820071258907365e-05, 'epoch': 1.46} + 7%|█████▎ | 1306/17840 [2:12:18<32:43:43, 7.13s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:12:18<32:43:43, 7.13s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:12:18<32:43:43, 7.13s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1307/17840 [2:12:25<32:32:48, 7.09s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1307/17840 [2:12:25<32:32:48, 7.09s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:46,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:46,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:12:32<32:21:44, 7.05s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:12:32<32:21:44, 7.05s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:12:32<32:21:44, 7.05s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:54,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:54,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0998, 'learning_rate': 9.818289786223278e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:54,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:54,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:53:54,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1310/17840 [2:12:46<31:52:14, 6.94s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:05,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:05,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:05,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [2:12:52<31:43:22, 6.91s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [2:12:52<31:43:22, 6.91s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:13,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:12:59<31:30:41, 6.86s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:12:59<31:30:41, 6.86s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6402, 'learning_rate': 9.816508313539193e-05, 'epoch': 1.47} + 7%|█████▎ | 1312/17840 [2:12:59<31:30:41, 6.86s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:12:59<31:30:41, 6.86s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:12:59<31:30:41, 6.86s/it]g-point operations will not be computed-17 18:51:59,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:13:06<31:26:08, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:13:06<31:26:08, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:13:06<31:26:08, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:13:06<31:26:08, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:13:13<31:11:11, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:13:13<31:11:11, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:33,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1315/17840 [2:13:19<31:10:30, 6.79s/it]g-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1315/17840 [2:13:19<31:10:30, 6.79s/it]g-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1105, 'learning_rate': 9.814726840855108e-05, 'epoch': 1.47} + 7%|█████▍ | 1315/17840 [2:13:19<31:10:30, 6.79s/it]g-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:42,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:42,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0583, 'learning_rate': 9.814133016627078e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:42,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:42,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:42,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:23,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1317/17840 [2:13:33<30:42:37, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1317/17840 [2:13:33<30:42:37, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1317/17840 [2:13:33<30:42:37, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:13:39<30:21:34, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:13:39<30:21:34, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:58,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:54:58,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [2:13:45<30:01:19, 6.54s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [2:13:45<30:01:19, 6.54s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.046, 'learning_rate': 9.812351543942993e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:06,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:13:52<29:54:40, 6.52s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:13:52<29:54:40, 6.52s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2095, 'learning_rate': 9.811757719714965e-05, 'epoch': 1.48} + 7%|█████▍ | 1320/17840 [2:13:52<29:54:40, 6.52s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:14,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:14,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0237, 'learning_rate': 9.811163895486937e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:14,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:20,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:20,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5538, 'learning_rate': 9.810570071258908e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:20,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:26,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:26,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2653, 'learning_rate': 9.80997624703088e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:26,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:33,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:33,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4189, 'learning_rate': 9.80938242280285e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:33,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:33,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:14:26<31:48:39, 6.93s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:14:26<31:48:39, 6.93s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2052, 'learning_rate': 9.808788598574821e-05, 'epoch': 1.49} + 7%|█████▍ | 1325/17840 [2:14:26<31:48:39, 6.93s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:14:26<31:48:39, 6.93s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:14:26<31:48:39, 6.93s/it]g-point operations will not be computed-17 18:54:50,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1326/17840 [2:14:32<30:36:26, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1326/17840 [2:14:32<30:36:26, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:53,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:53,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3398, 'learning_rate': 9.807600950118765e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:53,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:59,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:55:59,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1952, 'learning_rate': 9.807007125890737e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:03,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1329/17840 [2:14:49<27:48:22, 6.06s/it]g-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1329/17840 [2:14:49<27:48:22, 6.06s/it]g-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:07,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:07,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:55:49,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1330/17840 [2:14:54<27:07:46, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:11,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1330/17840 [2:14:54<27:07:46, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:11,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0666, 'learning_rate': 9.80581947743468e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:15,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:11,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:15,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:11,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0702, 'learning_rate': 9.80522565320665e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:19,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:11,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:19,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:11,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1332/17840 [2:15:05<25:26:19, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1332/17840 [2:15:05<25:26:19, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1332/17840 [2:15:05<25:26:19, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:25,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:27,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:27,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:30,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:32,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:32,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:34,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:36,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:36,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:38,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:39,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:39,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:41,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:43,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:43,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:46,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:46,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:47,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:50,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:50,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:51,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:51,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:53,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:53,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:54,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:54,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:56:58,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:02,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:02,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6614, 'learning_rate': 9.79809976247031e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:06,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:06,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:06,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:10,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:10,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:10,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:10,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:10,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:16:02<27:05:16, 5.91s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:16:02<27:05:16, 5.91s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:16:02<27:05:16, 5.91s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:25,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:25,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.361, 'learning_rate': 9.796318289786224e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:25,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:25,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:25,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:16:16<30:24:51, 6.64s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:16:16<30:24:51, 6.64s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:16:16<30:24:51, 6.64s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:39,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:39,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3018, 'learning_rate': 9.795130641330167e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:43,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:57:43,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:16:31<31:53:02, 6.96s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:16:31<31:53:02, 6.96s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0612, 'learning_rate': 9.794536817102138e-05, 'epoch': 1.51} + 8%|█████▌ | 1349/17840 [2:16:31<31:53:02, 6.96s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:16:31<31:53:02, 6.96s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:16:31<31:53:02, 6.96s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:16:41<35:33:48, 7.76s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:16:41<35:33:48, 7.76s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:16:41<35:33:48, 7.76s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:16:41<35:33:48, 7.76s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:16:41<35:33:48, 7.76s/it]g-point operations will not be computed-17 18:56:22,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [2:16:48<34:53:43, 7.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [2:16:48<34:53:43, 7.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [2:16:48<34:53:43, 7.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [2:16:48<34:53:43, 7.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:16:55<34:16:30, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:16:55<34:16:30, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:16:55<34:16:30, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:18,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:18,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2279, 'learning_rate': 9.792161520190025e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:18,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:18,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:18,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1354/17840 [2:17:09<33:17:42, 7.27s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1354/17840 [2:17:09<33:17:42, 7.27s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:30,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:17:16<32:56:23, 7.19s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:17:16<32:56:23, 7.19s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2539, 'learning_rate': 9.790973871733967e-05, 'epoch': 1.52} + 8%|█████▌ | 1355/17840 [2:17:16<32:56:23, 7.19s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:17:16<32:56:23, 7.19s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:17:16<32:56:23, 7.19s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:17:23<32:45:21, 7.15s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:42,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:42,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1357/17840 [2:17:30<32:27:35, 7.09s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1357/17840 [2:17:30<32:27:35, 7.09s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2214, 'learning_rate': 9.78978622327791e-05, 'epoch': 1.52} + 8%|█████▌ | 1357/17840 [2:17:30<32:27:35, 7.09s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:53,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:53,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6161, 'learning_rate': 9.789192399049881e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:53,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:53,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:58:53,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1359/17840 [2:17:44<31:55:10, 6.97s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:03,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:03,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:17:51<31:45:36, 6.94s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:17:51<31:45:36, 6.94s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0119, 'learning_rate': 9.788004750593825e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:11,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1361/17840 [2:17:58<31:31:08, 6.89s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1361/17840 [2:17:58<31:31:08, 6.89s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1241, 'learning_rate': 9.787410926365797e-05, 'epoch': 1.53} + 8%|█████▌ | 1361/17840 [2:17:58<31:31:08, 6.89s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1361/17840 [2:17:58<31:31:08, 6.89s/it]g-point operations will not be computed-17 18:58:05,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1362/17840 [2:18:04<31:31:25, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1362/17840 [2:18:04<31:31:25, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:25,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:18:11<31:13:32, 6.82s/it]g-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:18:11<31:13:32, 6.82s/it]g-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2229, 'learning_rate': 9.78622327790974e-05, 'epoch': 1.53} + 8%|█████▌ | 1363/17840 [2:18:11<31:13:32, 6.82s/it]g-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:33,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:33,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1874, 'learning_rate': 9.78562945368171e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:33,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:40,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:40,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6125, 'learning_rate': 9.785035629453682e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:40,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:40,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:40,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:22,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:18:31<30:27:54, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:18:31<30:27:54, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:18:31<30:27:54, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:18:31<30:27:54, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:18:37<30:11:50, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:56,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:56,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 18:59:56,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:18:44<29:53:18, 6.53s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:18:44<29:53:18, 6.53s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:04,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:04,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:18:50<29:46:01, 6.51s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:18:50<29:46:01, 6.51s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:18:50<29:46:01, 6.51s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:18:50<29:46:01, 6.51s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:12,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:12,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:12,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:12,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:18,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:18,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:18,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:25,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:25,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2006, 'learning_rate': 9.780878859857482e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:25,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:31,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:31,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2832, 'learning_rate': 9.780285035629454e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:31,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:37,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:37,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0783, 'learning_rate': 9.779691211401426e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:37,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:37,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:19:30<31:18:52, 6.85s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:19:30<31:18:52, 6.85s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2907, 'learning_rate': 9.779097387173397e-05, 'epoch': 1.54} + 8%|█████▋ | 1375/17840 [2:19:30<31:18:52, 6.85s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:51,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:51,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2369, 'learning_rate': 9.778503562945369e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:55,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:00:55,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1377/17840 [2:19:41<28:54:03, 6.32s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1377/17840 [2:19:41<28:54:03, 6.32s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:01,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:01,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:19:47<28:02:56, 6.13s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:05,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:05,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:05,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1379/17840 [2:19:53<27:19:10, 5.97s/it]g-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:11,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:14,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:14,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0867, 'learning_rate': 9.776128266033255e-05, 'epoch': 1.55} +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:14,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:14,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:19,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:21,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:21,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:21,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 18:59:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1382/17840 [2:20:08<25:05:32, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:28,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:28,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1383/17840 [2:20:13<24:06:15, 5.27s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:31,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:31,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:33,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:35,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:35,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:37,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:39,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:39,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:41,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:43,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:43,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:46,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:48,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:48,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:51,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:51,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:52,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:52,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:54,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:54,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:57,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:58,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:01:58,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4009, 'learning_rate': 9.769002375296912e-05, 'epoch': 1.56} +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:02,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:02,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:02,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:06,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:06,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:09,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:09,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:09,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:13,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:13,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:13,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:21,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:21,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0823, 'learning_rate': 9.767220902612827e-05, 'epoch': 1.56} +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:21,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:21,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:21:13<29:23:22, 6.43s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:21:13<29:23:22, 6.43s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2251, 'learning_rate': 9.766627078384799e-05, 'epoch': 1.57} + 8%|█████▋ | 1396/17840 [2:21:13<29:23:22, 6.43s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:21:13<29:23:22, 6.43s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:21:13<29:23:22, 6.43s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:21:20<30:37:25, 6.70s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:21:20<30:37:25, 6.70s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:02:41,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:21:28<31:33:49, 6.91s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:21:28<31:33:49, 6.91s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1292, 'learning_rate': 9.76543942992874e-05, 'epoch': 1.57} + 8%|█████▋ | 1398/17840 [2:21:28<31:33:49, 6.91s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:21:28<31:33:49, 6.91s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:21:35<32:14:50, 7.06s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:21:35<32:14:50, 7.06s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0614, 'learning_rate': 9.764845605700714e-05, 'epoch': 1.57} + 8%|█████▋ | 1399/17840 [2:21:35<32:14:50, 7.06s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:21:35<32:14:50, 7.06s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:21:35<32:14:50, 7.06s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:21:45<35:53:39, 7.86s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:21:45<35:53:39, 7.86s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:21:45<35:53:39, 7.86s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:07,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:07,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1205, 'learning_rate': 9.763657957244657e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:07,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:07,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1402/17840 [2:21:59<34:24:35, 7.54s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1402/17840 [2:21:59<34:24:35, 7.54s/it]g-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9216, 'learning_rate': 9.763064133016627e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:20,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:20,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:01:25,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:22:06<33:53:41, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:22:06<33:53:41, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:22:06<33:53:41, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:22:06<33:53:41, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1404/17840 [2:22:13<33:23:21, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1404/17840 [2:22:13<33:23:21, 7.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:34,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:22:20<32:57:17, 7.22s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:22:20<32:57:17, 7.22s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9617, 'learning_rate': 9.761282660332542e-05, 'epoch': 1.58} + 8%|█████▋ | 1405/17840 [2:22:20<32:57:17, 7.22s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:22:20<32:57:17, 7.22s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:22:20<32:57:17, 7.22s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:22:27<32:37:05, 7.15s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:22:27<32:37:05, 7.15s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:03:48,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:22:34<32:18:32, 7.08s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:22:34<32:18:32, 7.08s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1231, 'learning_rate': 9.760095011876486e-05, 'epoch': 1.58} + 8%|█████▊ | 1407/17840 [2:22:34<32:18:32, 7.08s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:22:34<32:18:32, 7.08s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:22:34<32:18:32, 7.08s/it]g-point operations will not be computed-17 19:03:24,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:22:41<32:04:38, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:22:41<32:04:38, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:22:41<32:04:38, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:22:41<32:04:38, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1409/17840 [2:22:48<31:52:23, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1409/17840 [2:22:48<31:52:23, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1409/17840 [2:22:48<31:52:23, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:10,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:10,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2489, 'learning_rate': 9.7583135391924e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:10,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:10,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:10,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:23:02<31:27:30, 6.89s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:21,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:21,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:23:08<31:16:12, 6.85s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:23:08<31:16:12, 6.85s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2001, 'learning_rate': 9.757125890736342e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:29,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1413/17840 [2:23:15<31:03:22, 6.81s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1413/17840 [2:23:15<31:03:22, 6.81s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1465, 'learning_rate': 9.756532066508314e-05, 'epoch': 1.58} + 8%|█████▊ | 1413/17840 [2:23:15<31:03:22, 6.81s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:37,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:37,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1182, 'learning_rate': 9.755938242280286e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:37,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:37,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:37,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1415/17840 [2:23:28<30:41:55, 6.73s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:47,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:47,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:23:35<30:30:51, 6.69s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:23:35<30:30:51, 6.69s/it]g-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9943, 'learning_rate': 9.754750593824229e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:55,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:55,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:55,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9622, 'learning_rate': 9.7541567695962e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:55,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:55,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:04:55,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:03:58,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:23:48<30:13:19, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:23:48<30:13:19, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:23:48<30:13:19, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:23:48<30:13:19, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:23:55<30:10:13, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:13,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:13,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:13,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1420/17840 [2:24:01<29:52:21, 6.55s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:20,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:20,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:20,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1421/17840 [2:24:07<29:32:04, 6.48s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:26,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:26,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:24:14<29:16:48, 6.42s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:24:14<29:16:48, 6.42s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:32,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:32,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1423/17840 [2:24:20<28:56:08, 6.35s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1423/17840 [2:24:20<28:56:08, 6.35s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1372, 'learning_rate': 9.750593824228029e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:40,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:24:26<28:47:20, 6.31s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:24:26<28:47:20, 6.31s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.122, 'learning_rate': 9.75e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:46,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1425/17840 [2:24:35<31:46:12, 6.97s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1425/17840 [2:24:35<31:46:12, 6.97s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0294, 'learning_rate': 9.749406175771972e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-17 19:05:55,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1426/17840 [2:24:41<30:33:57, 6.70s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1426/17840 [2:24:41<30:33:57, 6.70s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9828, 'learning_rate': 9.748812351543944e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:01,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1427/17840 [2:24:47<29:18:36, 6.43s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1427/17840 [2:24:47<29:18:36, 6.43s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1129, 'learning_rate': 9.748218527315916e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:06,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:06,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:24:52<28:19:52, 6.21s/it]g-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:11,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:11,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:11,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:05:05,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1429/17840 [2:24:58<27:32:15, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1429/17840 [2:24:58<27:32:15, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1809, 'learning_rate': 9.74643705463183e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:24,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2948, 'learning_rate': 9.7458432304038e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:28,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:28,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:15,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1432/17840 [2:25:14<25:23:04, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1432/17840 [2:25:14<25:23:04, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:34,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:34,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:37,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:39,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:39,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2072, 'learning_rate': 9.744061757719716e-05, 'epoch': 1.61} +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:42,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:42,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1435/17840 [2:25:28<22:20:23, 4.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:44,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:46,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:46,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:44,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1436/17840 [2:25:32<21:04:44, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:48,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1437/17840 [2:25:35<19:41:42, 4.32s/it]g-point operations will not be computed-17 19:06:48,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1437/17840 [2:25:35<19:41:42, 4.32s/it]g-point operations will not be computed-17 19:06:48,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:53,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:52,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:53,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:52,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1438/17840 [2:25:39<18:08:29, 3.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:06:55,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1439/17840 [2:25:42<16:48:39, 3.69s/it]g-point operations will not be computed-17 19:06:55,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1439/17840 [2:25:42<16:48:39, 3.69s/it]g-point operations will not be computed-17 19:06:55,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:59,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:58,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:06:59,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:06:58,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:01,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:00,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:01,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:00,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1441/17840 [2:25:47<13:53:22, 3.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:03,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1441/17840 [2:25:47<13:53:22, 3.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:03,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:25:49<12:37:01, 2.77s/it]g-point operations will not be computed-17 19:07:03,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:25:49<12:37:01, 2.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:06,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:25:49<12:37:01, 2.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:06,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:10,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:06,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:10,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:06,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:25:56<19:28:31, 4.28s/it]g-point operations will not be computed-17 19:07:06,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:25:56<19:28:31, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:14,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:18,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:14,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:26:04<24:01:20, 5.27s/it]g-point operations will not be computed-17 19:07:14,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:26:04<24:01:20, 5.27s/it]g-point operations will not be computed-17 19:07:14,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:26:04<24:01:20, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:21,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:26:04<24:01:20, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:21,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:26:04<24:01:20, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:21,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:26:12<27:02:58, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:21,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:26:12<27:02:58, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:21,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3712, 'learning_rate': 9.737529691211402e-05, 'epoch': 1.62} + 8%|█████▉ | 1445/17840 [2:26:12<27:02:58, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:21,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:26:12<27:02:58, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:21,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:26:12<27:02:58, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:21,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:26:19<28:53:22, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:26:19<28:53:22, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:26:19<28:53:22, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:26:26<30:21:04, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:26:26<30:21:04, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0243, 'learning_rate': 9.736342042755346e-05, 'epoch': 1.62} + 8%|█████▉ | 1447/17840 [2:26:26<30:21:04, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:26:26<30:21:04, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:26:26<30:21:04, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:26:34<31:11:58, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:26:34<31:11:58, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:07:54,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:26:41<31:36:46, 6.94s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:26:41<31:36:46, 6.94s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9775, 'learning_rate': 9.735154394299287e-05, 'epoch': 1.62} + 8%|█████▉ | 1449/17840 [2:26:41<31:36:46, 6.94s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:26:41<31:36:46, 6.94s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:26:50<35:15:00, 7.74s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:26:50<35:15:00, 7.74s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1188, 'learning_rate': 9.734560570071259e-05, 'epoch': 1.63} + 8%|█████▉ | 1450/17840 [2:26:50<35:15:00, 7.74s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:13,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:13,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3863, 'learning_rate': 9.73396674584323e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:17,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:17,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1452/17840 [2:27:05<33:59:44, 7.47s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1452/17840 [2:27:05<33:59:44, 7.47s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2514, 'learning_rate': 9.733372921615202e-05, 'epoch': 1.63} + 8%|█████▉ | 1452/17840 [2:27:05<33:59:44, 7.47s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1452/17840 [2:27:05<33:59:44, 7.47s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:27:12<33:29:38, 7.36s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:27:12<33:29:38, 7.36s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:31,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:31,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1454/17840 [2:27:19<33:02:11, 7.26s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1454/17840 [2:27:19<33:02:11, 7.26s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0425, 'learning_rate': 9.732185273159146e-05, 'epoch': 1.63} + 8%|█████▉ | 1454/17840 [2:27:19<33:02:11, 7.26s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:41,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:41,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3041, 'learning_rate': 9.731591448931117e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:41,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:41,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1456/17840 [2:27:33<32:23:55, 7.12s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1456/17840 [2:27:33<32:23:55, 7.12s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0884, 'learning_rate': 9.730997624703089e-05, 'epoch': 1.63} + 8%|█████▉ | 1456/17840 [2:27:33<32:23:55, 7.12s/it]g-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:55,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:55,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9956, 'learning_rate': 9.73040380047506e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:55,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:08:55,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:07:36,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1458/17840 [2:27:46<31:46:30, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1458/17840 [2:27:46<31:46:30, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8456, 'learning_rate': 9.729809976247031e-05, 'epoch': 1.63} + 8%|█████▉ | 1458/17840 [2:27:46<31:46:30, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:27:53<31:34:32, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:27:53<31:34:32, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0954, 'learning_rate': 9.729216152019003e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:14,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:28:00<31:18:05, 6.88s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:28:00<31:18:05, 6.88s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1713, 'learning_rate': 9.728622327790974e-05, 'epoch': 1.64} + 8%|█████▉ | 1460/17840 [2:28:00<31:18:05, 6.88s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:28:00<31:18:05, 6.88s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1461/17840 [2:28:07<31:10:53, 6.85s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1461/17840 [2:28:07<31:10:53, 6.85s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:26,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:26,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:28:14<31:09:57, 6.85s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:28:14<31:09:57, 6.85s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2493, 'learning_rate': 9.727434679334917e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:34,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1463/17840 [2:28:20<30:50:14, 6.78s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1463/17840 [2:28:20<30:50:14, 6.78s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0548, 'learning_rate': 9.726840855106889e-05, 'epoch': 1.64} + 8%|█████▉ | 1463/17840 [2:28:20<30:50:14, 6.78s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1463/17840 [2:28:20<30:50:14, 6.78s/it]g-point operations will not be computed-17 19:09:04,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:28:27<30:42:50, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:28:27<30:42:50, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7875, 'learning_rate': 9.72624703087886e-05, 'epoch': 1.64} + 8%|█████▉ | 1464/17840 [2:28:27<30:42:50, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:28:34<30:34:16, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:28:34<30:34:16, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2812, 'learning_rate': 9.725653206650832e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-17 19:09:54,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:28:40<30:12:53, 6.64s/it]g-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:28:40<30:12:53, 6.64s/it]g-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2252, 'learning_rate': 9.725059382422804e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:01,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:28:47<30:03:38, 6.61s/it]g-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:28:47<30:03:38, 6.61s/it]g-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1111, 'learning_rate': 9.724465558194776e-05, 'epoch': 1.64} + 8%|██████ | 1467/17840 [2:28:47<30:03:38, 6.61s/it]g-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:28:47<30:03:38, 6.61s/it]g-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:28:47<30:03:38, 6.61s/it]g-point operations will not be computed-17 19:09:44,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:28:53<29:56:59, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:10:10,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:28:53<29:56:59, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:10:10,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:28:53<29:56:59, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:10:10,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:29:00<29:41:12, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:29:00<29:41:12, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1263, 'learning_rate': 9.723277909738718e-05, 'epoch': 1.65} + 8%|██████ | 1469/17840 [2:29:00<29:41:12, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1470/17840 [2:29:06<29:30:48, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1470/17840 [2:29:06<29:30:48, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:25,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:25,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1471/17840 [2:29:12<29:17:28, 6.44s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1471/17840 [2:29:12<29:17:28, 6.44s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0881, 'learning_rate': 9.72209026128266e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:32,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1472/17840 [2:29:18<28:55:39, 6.36s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1472/17840 [2:29:18<28:55:39, 6.36s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5077, 'learning_rate': 9.721496437054632e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:39,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:29:25<28:39:20, 6.30s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:29:25<28:39:20, 6.30s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9797, 'learning_rate': 9.720902612826604e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:45,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:29:31<28:24:28, 6.25s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:29:31<28:24:28, 6.25s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0126, 'learning_rate': 9.720308788598576e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:51,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:51,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:29:39<31:08:01, 6.85s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:29:39<31:08:01, 6.85s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:59,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:10:59,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1476/17840 [2:29:45<29:49:45, 6.56s/it]g-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:03,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:03,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:03,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:10:17,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1477/17840 [2:29:51<28:39:16, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1477/17840 [2:29:51<28:39:16, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:12,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:12,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0524, 'learning_rate': 9.717933491686461e-05, 'epoch': 1.66} +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:12,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:12,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:17,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:20,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:20,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:20,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:08,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1480/17840 [2:30:07<26:08:30, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:24,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1480/17840 [2:30:07<26:08:30, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:24,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1480/17840 [2:30:07<26:08:30, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:24,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:28,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:24,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:28,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:24,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:32,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:24,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:32,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:24,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1482/17840 [2:30:17<24:41:36, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:37,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:37,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1483/17840 [2:30:22<23:55:09, 5.26s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:40,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:42,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:42,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:45,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:47,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:47,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:49,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:51,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:51,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:53,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:54,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:54,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:56,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:56,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:11:58,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:01,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:01,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:02,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:02,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:05,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:05,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:07,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:07,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:08,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:08,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:12,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:12,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:12,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:16,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:16,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:20,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:20,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:20,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:31:08<24:07:17, 5.31s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:31:08<24:07:17, 5.31s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:31:08<24:07:17, 5.31s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:31:08<24:07:17, 5.31s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:31:08<24:07:17, 5.31s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:31:16<27:14:42, 6.00s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:35,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:35,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:35,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:31:23<28:56:54, 6.38s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:31:23<28:56:54, 6.38s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:31:23<28:56:54, 6.38s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:31:23<28:56:54, 6.38s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:31:23<28:56:54, 6.38s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:31:30<30:10:34, 6.65s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:49,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:12:49,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:31:38<31:12:19, 6.87s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:31:38<31:12:19, 6.87s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2425, 'learning_rate': 9.706057007125891e-05, 'epoch': 1.68} + 8%|██████▏ | 1498/17840 [2:31:38<31:12:19, 6.87s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:31:38<31:12:19, 6.87s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:31:38<31:12:19, 6.87s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:31:45<31:43:01, 6.99s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:31:45<31:43:01, 6.99s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:06,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0176, 'learning_rate': 9.704869358669835e-05, 'epoch': 1.68} + g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1501/17840 [2:32:02<34:42:19, 7.65s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1501/17840 [2:32:02<34:42:19, 7.65s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5377, 'learning_rate': 9.704275534441806e-05, 'epoch': 1.68} + 8%|██████▏ | 1501/17840 [2:32:02<34:42:19, 7.65s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:24,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:24,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4229, 'learning_rate': 9.703681710213777e-05, 'epoch': 1.68} +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:24,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:24,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:24,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1503/17840 [2:32:16<33:12:36, 7.32s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1503/17840 [2:32:16<33:12:36, 7.32s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:37,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:32:23<32:48:38, 7.23s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:32:23<32:48:38, 7.23s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1397, 'learning_rate': 9.702494061757719e-05, 'epoch': 1.69} + 8%|██████▏ | 1504/17840 [2:32:23<32:48:38, 7.23s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:32:23<32:48:38, 7.23s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1504/17840 [2:32:23<32:48:38, 7.23s/it]g-point operations will not be computed-17 19:11:34,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:32:30<32:23:54, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:32:30<32:23:54, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:32:30<32:23:54, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1506/17840 [2:32:37<32:08:38, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1506/17840 [2:32:37<32:08:38, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0408, 'learning_rate': 9.701306413301663e-05, 'epoch': 1.69} + 8%|██████▏ | 1506/17840 [2:32:37<32:08:38, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:59,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:59,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.229, 'learning_rate': 9.700712589073635e-05, 'epoch': 1.69} +[WARNING|modeling_utils.py:388] 2022-03-17 19:13:59,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:06,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:06,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:06,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:09,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:09,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1509/17840 [2:32:57<31:14:58, 6.89s/it]g-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1509/17840 [2:32:57<31:14:58, 6.89s/it]g-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:16,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:16,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:16,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1510/17840 [2:33:04<31:01:07, 6.84s/it]g-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1510/17840 [2:33:04<31:01:07, 6.84s/it]g-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1510/17840 [2:33:04<31:01:07, 6.84s/it]g-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1510/17840 [2:33:04<31:01:07, 6.84s/it]g-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1510/17840 [2:33:04<31:01:07, 6.84s/it]g-point operations will not be computed-17 19:13:47,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:33:11<30:54:23, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:33:11<30:54:23, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:33:11<30:54:23, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:33:11<30:54:23, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1512/17840 [2:33:17<30:50:56, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1512/17840 [2:33:17<30:50:56, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:38,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:38,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1513/17840 [2:33:24<30:42:00, 6.77s/it]g-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1513/17840 [2:33:24<30:42:00, 6.77s/it]g-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1513/17840 [2:33:24<30:42:00, 6.77s/it]g-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:46,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:46,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6139, 'learning_rate': 9.696555819477436e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:46,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:46,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:14:46,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:28,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1515/17840 [2:33:37<30:26:35, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1515/17840 [2:33:37<30:26:35, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1515/17840 [2:33:37<30:26:35, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1515/17840 [2:33:37<30:26:35, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1516/17840 [2:33:44<30:11:27, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:03,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:03,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:03,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1517/17840 [2:33:51<30:04:39, 6.63s/it]g-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:09,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:12,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:12,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1225, 'learning_rate': 9.694180522565321e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:12,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:19,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:19,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0524, 'learning_rate': 9.693586698337293e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:19,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:25,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:25,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1141, 'learning_rate': 9.692992874109265e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:25,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:31,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:31,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1484, 'learning_rate': 9.692399049881236e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:31,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:38,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:38,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.224, 'learning_rate': 9.691805225653206e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:38,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:44,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:44,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0, 'learning_rate': 9.691211401425179e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:44,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:50,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:50,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3628, 'learning_rate': 9.690617577197149e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:50,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:50,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:15:50,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1525/17840 [2:34:43<31:10:17, 6.88s/it]g-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:01,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:01,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:01,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:14:55,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1526/17840 [2:34:49<29:55:05, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1526/17840 [2:34:49<29:55:05, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:10,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:10,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4084, 'learning_rate': 9.688836104513065e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:10,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:16,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:16,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1671, 'learning_rate': 9.688242280285036e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:20,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1529/17840 [2:35:06<27:20:04, 6.03s/it]g-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1529/17840 [2:35:06<27:20:04, 6.03s/it]g-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:24,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:24,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:24,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:06,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1530/17840 [2:35:12<26:36:11, 5.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:28,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1530/17840 [2:35:12<26:36:11, 5.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:28,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:32,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:28,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:32,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:28,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1601, 'learning_rate': 9.686460807600951e-05, 'epoch': 1.72} +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:36,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:28,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:36,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:28,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1532/17840 [2:35:22<25:03:43, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:39,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1532/17840 [2:35:22<25:03:43, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:39,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:42,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:39,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:42,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:39,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:45,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:39,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:45,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:39,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:45,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:39,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1534/17840 [2:35:32<23:17:54, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:48,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:50,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:48,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:50,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:48,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1535/17840 [2:35:36<22:09:14, 4.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:52,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:54,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:52,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:16:54,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:16:52,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1536/17840 [2:35:40<20:53:14, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:16:56,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1537/17840 [2:35:43<19:34:05, 4.32s/it]g-point operations will not be computed-17 19:16:56,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1537/17840 [2:35:43<19:34:05, 4.32s/it]g-point operations will not be computed-17 19:16:56,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1537/17840 [2:35:43<19:34:05, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:00,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1538/17840 [2:35:47<18:08:51, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:03,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1538/17840 [2:35:47<18:08:51, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:03,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1539/17840 [2:35:50<16:40:36, 3.68s/it]g-point operations will not be computed-17 19:17:03,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1539/17840 [2:35:50<16:40:36, 3.68s/it]g-point operations will not be computed-17 19:17:03,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:07,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:06,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:07,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:06,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1540/17840 [2:35:52<15:16:24, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:08,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1541/17840 [2:35:55<13:56:58, 3.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:11,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1541/17840 [2:35:55<13:56:58, 3.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:11,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1542/17840 [2:35:57<12:38:06, 2.79s/it]g-point operations will not be computed-17 19:17:11,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1542/17840 [2:35:57<12:38:06, 2.79s/it]g-point operations will not be computed-17 19:17:11,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1542/17840 [2:35:57<12:38:06, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:14,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1542/17840 [2:35:57<12:38:06, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:14,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:18,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:14,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1543/17840 [2:36:05<19:29:27, 4.31s/it]g-point operations will not be computed-17 19:17:14,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1543/17840 [2:36:05<19:29:27, 4.31s/it]g-point operations will not be computed-17 19:17:14,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1543/17840 [2:36:05<19:29:27, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1543/17840 [2:36:05<19:29:27, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:26,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:26,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:36:12<24:09:03, 5.34s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:36:12<24:09:03, 5.34s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:36:12<24:09:03, 5.34s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:36:12<24:09:03, 5.34s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:36:12<24:09:03, 5.34s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1545/17840 [2:36:20<27:07:15, 5.99s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1545/17840 [2:36:20<27:07:15, 5.99s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1546/17840 [2:36:27<29:03:56, 6.42s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1546/17840 [2:36:27<29:03:56, 6.42s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1831, 'learning_rate': 9.677553444180523e-05, 'epoch': 1.73} + 9%|██████▎ | 1546/17840 [2:36:27<29:03:56, 6.42s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1546/17840 [2:36:27<29:03:56, 6.42s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1546/17840 [2:36:27<29:03:56, 6.42s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:36:35<30:22:00, 6.71s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:36:35<30:22:00, 6.71s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:36:35<30:22:00, 6.71s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:58,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:58,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0339, 'learning_rate': 9.676365795724466e-05, 'epoch': 1.74} +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:58,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:58,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:17:58,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:36:49<31:44:56, 7.02s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:36:49<31:44:56, 7.02s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:36:49<31:44:56, 7.02s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:36:49<31:44:56, 7.02s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1549/17840 [2:36:49<31:44:56, 7.02s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:36:59<35:15:33, 7.79s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:36:59<35:15:33, 7.79s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:20,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1551/17840 [2:37:06<34:34:46, 7.64s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1551/17840 [2:37:06<34:34:46, 7.64s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1055, 'learning_rate': 9.67458432304038e-05, 'epoch': 1.74} + 9%|██████▎ | 1551/17840 [2:37:06<34:34:46, 7.64s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1551/17840 [2:37:06<34:34:46, 7.64s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:37:13<33:57:38, 7.51s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:37:13<33:57:38, 7.51s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7728, 'learning_rate': 9.673990498812353e-05, 'epoch': 1.74} +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:34,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1553/17840 [2:37:20<33:18:10, 7.36s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1553/17840 [2:37:20<33:18:10, 7.36s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1316, 'learning_rate': 9.673396674584323e-05, 'epoch': 1.74} + 9%|██████▎ | 1553/17840 [2:37:20<33:18:10, 7.36s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1553/17840 [2:37:20<33:18:10, 7.36s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1553/17840 [2:37:20<33:18:10, 7.36s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1554/17840 [2:37:28<33:00:25, 7.30s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:47,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:18:47,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1555/17840 [2:37:35<32:41:30, 7.23s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1555/17840 [2:37:35<32:41:30, 7.23s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1676, 'learning_rate': 9.672209026128266e-05, 'epoch': 1.74} + 9%|██████▎ | 1555/17840 [2:37:35<32:41:30, 7.23s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1555/17840 [2:37:35<32:41:30, 7.23s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1555/17840 [2:37:35<32:41:30, 7.23s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1556/17840 [2:37:42<32:18:19, 7.14s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:01,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:01,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1557/17840 [2:37:49<31:57:52, 7.07s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1557/17840 [2:37:49<31:57:52, 7.07s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1863, 'learning_rate': 9.671021377672209e-05, 'epoch': 1.75} + 9%|██████▎ | 1557/17840 [2:37:49<31:57:52, 7.07s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2368, 'learning_rate': 9.670427553444181e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:11,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1559/17840 [2:38:02<31:27:09, 6.95s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:21,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:21,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1560/17840 [2:38:09<31:14:18, 6.91s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1560/17840 [2:38:09<31:14:18, 6.91s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4587, 'learning_rate': 9.669239904988125e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:30,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1561/17840 [2:38:16<31:05:15, 6.87s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1561/17840 [2:38:16<31:05:15, 6.87s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3738, 'learning_rate': 9.668646080760096e-05, 'epoch': 1.75} + 9%|██████▍ | 1561/17840 [2:38:16<31:05:15, 6.87s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:38,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:38,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:38,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5001, 'learning_rate': 9.668052256532068e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:38,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1563/17840 [2:38:29<30:41:32, 6.79s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1563/17840 [2:38:29<30:41:32, 6.79s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3996, 'learning_rate': 9.667458432304038e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:50,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1564/17840 [2:38:36<30:28:39, 6.74s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1564/17840 [2:38:36<30:28:39, 6.74s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2327, 'learning_rate': 9.666864608076009e-05, 'epoch': 1.75} + 9%|██████▍ | 1564/17840 [2:38:36<30:28:39, 6.74s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8337, 'learning_rate': 9.666270783847981e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:19:58,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1566/17840 [2:38:49<30:11:00, 6.68s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:08,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:08,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:08,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1567/17840 [2:38:56<30:02:18, 6.65s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1567/17840 [2:38:56<30:02:18, 6.65s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:16,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:16,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1568/17840 [2:39:02<29:52:34, 6.61s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1568/17840 [2:39:02<29:52:34, 6.61s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:23,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1569/17840 [2:39:09<29:37:23, 6.55s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|████��█▍ | 1569/17840 [2:39:09<29:37:23, 6.55s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0515, 'learning_rate': 9.663895486935868e-05, 'epoch': 1.76} + 9%|██████▍ | 1569/17840 [2:39:09<29:37:23, 6.55s/it]g-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:30,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:30,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2091, 'learning_rate': 9.663301662707838e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:30,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:30,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:30,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:17:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1571/17840 [2:39:21<29:01:01, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1571/17840 [2:39:21<29:01:01, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:43,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:43,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2457, 'learning_rate': 9.662114014251783e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:43,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:49,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:49,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3338, 'learning_rate': 9.661520190023755e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:49,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:55,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:55,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9396, 'learning_rate': 9.660926365795725e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:55,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:20:55,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1575/17840 [2:39:48<30:56:58, 6.85s/it]g-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1575/17840 [2:39:48<30:56:58, 6.85s/it]g-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9483, 'learning_rate': 9.660332541567696e-05, 'epoch': 1.77} + 9%|██████▍ | 1575/17840 [2:39:48<30:56:58, 6.85s/it]g-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:09,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:09,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2075, 'learning_rate': 9.659738717339668e-05, 'epoch': 1.77} +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:14,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:14,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1577/17840 [2:40:00<28:39:57, 6.35s/it]g-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1577/17840 [2:40:00<28:39:57, 6.35s/it]g-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:20,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:20,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1578/17840 [2:40:05<27:46:14, 6.15s/it]g-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:24,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:24,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:24,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:20:38,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1579/17840 [2:40:11<27:01:41, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1579/17840 [2:40:11<27:01:41, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:32,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:32,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.085, 'learning_rate': 9.657363420427555e-05, 'epoch': 1.77} +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:36,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:36,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1581/17840 [2:40:22<25:29:17, 5.64s/it]g-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:40,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:42,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:42,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.954, 'learning_rate': 9.656175771971497e-05, 'epoch': 1.77} +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:46,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:46,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:28,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1583/17840 [2:40:32<23:55:40, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:48,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:50,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:48,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:50,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:48,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1584/17840 [2:40:36<22:46:38, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:53,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:55,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:53,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:55,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:53,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1585/17840 [2:40:40<21:39:05, 4.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:21:57,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:59,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:57,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:21:59,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:21:57,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1586/17840 [2:40:44<20:27:50, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:01,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:03,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:01,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:03,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:01,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1587/17840 [2:40:48<19:15:34, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1588/17840 [2:40:51<17:55:49, 3.97s/it]g-point operations will not be computed-17 19:22:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1588/17840 [2:40:51<17:55:49, 3.97s/it]g-point operations will not be computed-17 19:22:04,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:09,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:07,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:09,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:07,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1589/17840 [2:40:54<16:29:16, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:10,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1590/17840 [2:40:57<15:08:01, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:13,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1590/17840 [2:40:57<15:08:01, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:13,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1591/17840 [2:40:59<13:47:35, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:15,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1591/17840 [2:40:59<13:47:35, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:15,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1592/17840 [2:41:01<12:30:37, 2.77s/it]g-point operations will not be computed-17 19:22:15,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1592/17840 [2:41:01<12:30:37, 2.77s/it]g-point operations will not be computed-17 19:22:15,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1592/17840 [2:41:01<12:30:37, 2.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:19,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1592/17840 [2:41:01<12:30:37, 2.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:19,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:23,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:19,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1593/17840 [2:41:09<19:18:11, 4.28s/it]g-point operations will not be computed-17 19:22:19,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1593/17840 [2:41:09<19:18:11, 4.28s/it]g-point operations will not be computed-17 19:22:19,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1593/17840 [2:41:09<19:18:11, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1593/17840 [2:41:09<19:18:11, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:30,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:30,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1594/17840 [2:41:17<23:43:54, 5.26s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1594/17840 [2:41:17<23:43:54, 5.26s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1594/17840 [2:41:17<23:43:54, 5.26s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1594/17840 [2:41:17<23:43:54, 5.26s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1594/17840 [2:41:17<23:43:54, 5.26s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1595/17840 [2:41:24<26:41:58, 5.92s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1595/17840 [2:41:24<26:41:58, 5.92s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:22:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:41:31<28:31:27, 6.32s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:41:31<28:31:27, 6.32s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3186, 'learning_rate': 9.647862232779098e-05, 'epoch': 1.79} + 9%|██████▌ | 1596/17840 [2:41:31<28:31:27, 6.32s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:41:31<28:31:27, 6.32s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:41:31<28:31:27, 6.32s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1597/17840 [2:41:39<30:01:17, 6.65s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1597/17840 [2:41:39<30:01:17, 6.65s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1597/17840 [2:41:39<30:01:17, 6.65s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:01,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:01,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1089, 'learning_rate': 9.64667458432304e-05, 'epoch': 1.79} +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:01,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:01,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1599/17840 [2:41:53<31:31:17, 6.99s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1599/17840 [2:41:53<31:31:17, 6.99s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2014, 'learning_rate': 9.646080760095013e-05, 'epoch': 1.79} + 9%|██████▌ | 1599/17840 [2:41:53<31:31:17, 6.99s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1599/17840 [2:41:53<31:31:17, 6.99s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1599/17840 [2:41:53<31:31:17, 6.99s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:42:03<35:16:05, 7.82s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:42:03<35:16:05, 7.82s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:42:03<35:16:05, 7.82s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:26,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:26,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2896, 'learning_rate': 9.644893111638955e-05, 'epoch': 1.79} +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:26,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:26,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1602/17840 [2:42:18<33:52:46, 7.51s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1602/17840 [2:42:18<33:52:46, 7.51s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2767, 'learning_rate': 9.644299287410927e-05, 'epoch': 1.8} + 9%|██████▌ | 1602/17840 [2:42:18<33:52:46, 7.51s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:40,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:40,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1863, 'learning_rate': 9.643705463182898e-05, 'epoch': 1.8} +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:40,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:40,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:40,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1604/17840 [2:42:32<32:54:56, 7.30s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1604/17840 [2:42:32<32:54:56, 7.30s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1604/17840 [2:42:32<32:54:56, 7.30s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:54,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:54,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3179, 'learning_rate': 9.642517814726841e-05, 'epoch': 1.8} +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:54,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:54,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:23:54,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1606/17840 [2:42:46<32:14:04, 7.15s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:05,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:05,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1607/17840 [2:42:53<31:52:13, 7.07s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1607/17840 [2:42:53<31:52:13, 7.07s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3681, 'learning_rate': 9.641330166270785e-05, 'epoch': 1.8} + 9%|██████▌ | 1607/17840 [2:42:53<31:52:13, 7.07s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:15,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:15,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0498, 'learning_rate': 9.640736342042755e-05, 'epoch': 1.8} +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:15,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:15,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1609/17840 [2:43:06<31:21:23, 6.95s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1609/17840 [2:43:06<31:21:23, 6.95s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:25,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:25,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1610/17840 [2:43:13<31:13:34, 6.93s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1610/17840 [2:43:13<31:13:34, 6.93s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0794, 'learning_rate': 9.639548693586698e-05, 'epoch': 1.8} + 9%|██████▌ | 1610/17840 [2:43:13<31:13:34, 6.93s/it]g-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3052, 'learning_rate': 9.63895486935867e-05, 'epoch': 1.81} +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:22:26,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1612/17840 [2:43:27<30:39:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1612/17840 [2:43:27<30:39:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1612/17840 [2:43:27<30:39:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1612/17840 [2:43:27<30:39:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1613/17840 [2:43:33<30:30:16, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:52,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:52,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:24:52,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1614/17840 [2:43:40<30:15:09, 6.71s/it]g-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1614/17840 [2:43:40<30:15:09, 6.71s/it]g-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1614/17840 [2:43:40<30:15:09, 6.71s/it]g-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1614/17840 [2:43:40<30:15:09, 6.71s/it]g-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:02,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:02,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:02,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:02,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:02,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:24:44,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1616/17840 [2:43:53<29:59:12, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1616/17840 [2:43:53<29:59:12, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1616/17840 [2:43:53<29:59:12, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1616/17840 [2:43:53<29:59:12, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1617/17840 [2:43:59<29:41:00, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:18,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:18,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1618/17840 [2:44:06<29:24:49, 6.53s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1618/17840 [2:44:06<29:24:49, 6.53s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:25,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:25,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:25,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1619/17840 [2:44:12<29:17:41, 6.50s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1619/17840 [2:44:12<29:17:41, 6.50s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:33,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:33,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1620/17840 [2:44:19<29:09:50, 6.47s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1620/17840 [2:44:19<29:09:50, 6.47s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1620/17840 [2:44:19<29:09:50, 6.47s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1620/17840 [2:44:19<29:09:50, 6.47s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:40,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:40,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:45,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:45,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:44:31<28:55:05, 6.42s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:44:31<28:55:05, 6.42s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:44:31<28:55:05, 6.42s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:44:31<28:55:05, 6.42s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:53,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:53,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:53,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:59,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:25:59,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9467, 'learning_rate': 9.6312351543943e-05, 'epoch': 1.82} +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:04,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1625/17840 [2:44:52<31:18:56, 6.95s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1625/17840 [2:44:52<31:18:56, 6.95s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1818, 'learning_rate': 9.63064133016627e-05, 'epoch': 1.82} + 9%|██████▋ | 1625/17840 [2:44:52<31:18:56, 6.95s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1625/17840 [2:44:52<31:18:56, 6.95s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1625/17840 [2:44:52<31:18:56, 6.95s/it]g-point operations will not be computed-17 19:25:10,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1626/17840 [2:44:58<30:12:46, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1626/17840 [2:44:58<30:12:46, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:20,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:20,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0103, 'learning_rate': 9.629453681710215e-05, 'epoch': 1.82} +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:24,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1628/17840 [2:45:10<28:12:30, 6.26s/it]g-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1628/17840 [2:45:10<28:12:30, 6.26s/it]g-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:28,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:28,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:28,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1629/17840 [2:45:16<27:31:21, 6.11s/it]g-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:34,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:34,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:34,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:15,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1630/17840 [2:45:21<26:47:52, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1630/17840 [2:45:21<26:47:52, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9529, 'learning_rate': 9.6270783847981e-05, 'epoch': 1.83} +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1632/17840 [2:45:32<25:21:37, 5.63s/it]g-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:50,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:53,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:53,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1714, 'learning_rate': 9.625890736342044e-05, 'epoch': 1.83} +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:56,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:26:56,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:38,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1634/17840 [2:45:42<23:31:14, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:26:58,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:01,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:58,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:01,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:26:58,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1635/17840 [2:45:46<22:13:44, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:03,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:05,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:03,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:05,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:03,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1636/17840 [2:45:50<21:09:19, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:07,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:09,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:07,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:09,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:07,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1637/17840 [2:45:54<19:49:42, 4.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:10,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1638/17840 [2:45:57<18:20:50, 4.08s/it]g-point operations will not be computed-17 19:27:10,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1638/17840 [2:45:57<18:20:50, 4.08s/it]g-point operations will not be computed-17 19:27:10,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1638/17840 [2:45:57<18:20:50, 4.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:14,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1638/17840 [2:45:57<18:20:50, 4.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:14,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1639/17840 [2:46:00<16:56:13, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:17,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1640/17840 [2:46:03<15:27:13, 3.43s/it]g-point operations will not be computed-17 19:27:17,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1640/17840 [2:46:03<15:27:13, 3.43s/it]g-point operations will not be computed-17 19:27:17,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:20,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:19,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:20,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:19,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1642/17840 [2:46:07<12:32:24, 2.79s/it]g-point operations will not be computed-17 19:27:21,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1642/17840 [2:46:07<12:32:24, 2.79s/it]g-point operations will not be computed-17 19:27:21,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1642/17840 [2:46:07<12:32:24, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:25,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1642/17840 [2:46:07<12:32:24, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:25,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:29,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:25,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1643/17840 [2:46:15<19:23:24, 4.31s/it]g-point operations will not be computed-17 19:27:25,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1643/17840 [2:46:15<19:23:24, 4.31s/it]g-point operations will not be computed-17 19:27:25,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1643/17840 [2:46:15<19:23:24, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1643/17840 [2:46:15<19:23:24, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:36,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:36,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1644/17840 [2:46:23<23:38:12, 5.25s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1644/17840 [2:46:23<23:38:12, 5.25s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1644/17840 [2:46:23<23:38:12, 5.25s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:46,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:46,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.064, 'learning_rate': 9.6187648456057e-05, 'epoch': 1.84} +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:46,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:27:46,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:46:38<28:39:24, 6.37s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:46:38<28:39:24, 6.37s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3099, 'learning_rate': 9.618171021377672e-05, 'epoch': 1.85} + 9%|██████▋ | 1646/17840 [2:46:38<28:39:24, 6.37s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:46:38<28:39:24, 6.37s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:46:38<28:39:24, 6.37s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1647/17840 [2:46:45<29:50:43, 6.64s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1648/17840 [2:46:52<30:47:07, 6.84s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1648/17840 [2:46:52<30:47:07, 6.84s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1869, 'learning_rate': 9.616983372921615e-05, 'epoch': 1.85} + 9%|██████▋ | 1648/17840 [2:46:52<30:47:07, 6.84s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1648/17840 [2:46:52<30:47:07, 6.84s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1649/17840 [2:46:59<31:11:02, 6.93s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1649/17840 [2:46:59<31:11:02, 6.93s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1646, 'learning_rate': 9.616389548693587e-05, 'epoch': 1.85} +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:20,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:47:09<34:53:03, 7.76s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:47:09<34:53:03, 7.76s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.456, 'learning_rate': 9.615795724465558e-05, 'epoch': 1.85} + 9%|██████▊ | 1650/17840 [2:47:09<34:53:03, 7.76s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:47:09<34:53:03, 7.76s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1651/17840 [2:47:16<34:09:49, 7.60s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1651/17840 [2:47:16<34:09:49, 7.60s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.836, 'learning_rate': 9.61520190023753e-05, 'epoch': 1.85} + 9%|██████▊ | 1651/17840 [2:47:16<34:09:49, 7.60s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:39,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:39,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3972, 'learning_rate': 9.614608076009502e-05, 'epoch': 1.85} +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:39,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:39,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███��██▊ | 1653/17840 [2:47:30<33:02:48, 7.35s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1653/17840 [2:47:30<33:02:48, 7.35s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9725, 'learning_rate': 9.614014251781474e-05, 'epoch': 1.85} +[WARNING|modeling_utils.py:388] 2022-03-17 19:28:51,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:47:37<32:31:57, 7.24s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:47:37<32:31:57, 7.24s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0705, 'learning_rate': 9.613420427553445e-05, 'epoch': 1.85} + 9%|██████▊ | 1654/17840 [2:47:37<32:31:57, 7.24s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:47:37<32:31:57, 7.24s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:47:44<32:09:44, 7.15s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:47:44<32:09:44, 7.15s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9887, 'learning_rate': 9.612826603325417e-05, 'epoch': 1.86} +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:05,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1656/17840 [2:47:51<31:55:39, 7.10s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1656/17840 [2:47:51<31:55:39, 7.10s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1493, 'learning_rate': 9.612232779097387e-05, 'epoch': 1.86} + 9%|██████▊ | 1656/17840 [2:47:51<31:55:39, 7.10s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1656/17840 [2:47:51<31:55:39, 7.10s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1657/17840 [2:47:58<31:46:42, 7.07s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1657/17840 [2:47:58<31:46:42, 7.07s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:17,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1658/17840 [2:48:05<31:36:43, 7.03s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1658/17840 [2:48:05<31:36:43, 7.03s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2771, 'learning_rate': 9.61104513064133e-05, 'epoch': 1.86} + 9%|██████▊ | 1658/17840 [2:48:05<31:36:43, 7.03s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:28,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:28,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1395, 'learning_rate': 9.610451306413302e-05, 'epoch': 1.86} +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:28,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:28,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:28,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1660/17840 [2:48:19<31:12:13, 6.94s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:38,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:38,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:38,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1661/17840 [2:48:26<30:50:33, 6.86s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1661/17840 [2:48:26<30:50:33, 6.86s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1661/17840 [2:48:26<30:50:33, 6.86s/it]g-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:48,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:48,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1935, 'learning_rate': 9.608669833729217e-05, 'epoch': 1.86} +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:48,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:48,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:29:48,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:27:33,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1663/17840 [2:48:39<30:29:05, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1663/17840 [2:48:39<30:29:05, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1663/17840 [2:48:39<30:29:05, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1663/17840 [2:48:39<30:29:05, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1664/17840 [2:48:46<30:21:54, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1664/17840 [2:48:46<30:21:54, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:06,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:06,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1665/17840 [2:48:53<30:18:53, 6.75s/it]g-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1665/17840 [2:48:53<30:18:53, 6.75s/it]g-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1665/17840 [2:48:53<30:18:53, 6.75s/it]g-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:15,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:15,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1972, 'learning_rate': 9.606294536817104e-05, 'epoch': 1.87} +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:15,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:15,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:15,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:29:56,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:49:06<29:52:54, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:49:06<29:52:54, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:49:06<29:52:54, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:49:06<29:52:54, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1668/17840 [2:49:12<29:35:45, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:31,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:31,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:31,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1669/17840 [2:49:19<29:21:02, 6.53s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:37,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:37,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:37,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1670/17840 [2:49:25<29:13:33, 6.51s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1670/17840 [2:49:25<29:13:33, 6.51s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:45,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:45,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1671/17840 [2:49:31<28:59:35, 6.46s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1671/17840 [2:49:31<28:59:35, 6.46s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:52,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1672/17840 [2:49:38<28:49:12, 6.42s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1672/17840 [2:49:38<28:49:12, 6.42s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9001, 'learning_rate': 9.602731591448932e-05, 'epoch': 1.87} +[WARNING|modeling_utils.py:388] 2022-03-17 19:30:58,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1673/17840 [2:49:44<28:36:48, 6.37s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1673/17840 [2:49:44<28:36:48, 6.37s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5382, 'learning_rate': 9.602137767220904e-05, 'epoch': 1.88} + 9%|██████▊ | 1673/17840 [2:49:44<28:36:48, 6.37s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:06,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:06,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3851, 'learning_rate': 9.601543942992875e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:06,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:06,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1675/17840 [2:49:58<30:58:32, 6.90s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1675/17840 [2:49:58<30:58:32, 6.90s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0739, 'learning_rate': 9.600950118764847e-05, 'epoch': 1.88} + 9%|██████▊ | 1675/17840 [2:49:58<30:58:32, 6.90s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:20,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:20,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1496, 'learning_rate': 9.600356294536817e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:24,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:24,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1677/17840 [2:50:10<28:36:31, 6.37s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1677/17840 [2:50:10<28:36:31, 6.37s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:30,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:30,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1678/17840 [2:50:16<27:41:38, 6.17s/it]g-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:34,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:34,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:34,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:30:23,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1679/17840 [2:50:21<26:53:34, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:31:38,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1679/17840 [2:50:21<26:53:34, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:31:38,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:42,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:38,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:42,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:38,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0302, 'learning_rate': 9.597980997624704e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:46,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:38,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:46,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:38,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1681/17840 [2:50:32<25:20:41, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1681/17840 [2:50:32<25:20:41, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:52,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:52,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:55,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:57,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:31:57,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3335, 'learning_rate': 9.596199524940617e-05, 'epoch': 1.89} +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:01,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:01,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:31:49,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1684/17840 [2:50:46<22:38:55, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:03,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:05,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:03,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1685/17840 [2:50:51<21:42:58, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:07,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1685/17840 [2:50:51<21:42:58, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:07,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:09,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:07,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1686/17840 [2:50:55<20:31:52, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:11,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1686/17840 [2:50:55<20:31:52, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:11,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:13,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:11,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:13,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:11,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1687/17840 [2:50:58<19:14:34, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:15,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1688/17840 [2:51:02<17:54:31, 3.99s/it]g-point operations will not be computed-17 19:32:15,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1688/17840 [2:51:02<17:54:31, 3.99s/it]g-point operations will not be computed-17 19:32:15,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:19,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:18,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:19,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:18,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1689/17840 [2:51:05<16:30:01, 3.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:21,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1690/17840 [2:51:07<15:10:11, 3.38s/it]g-point operations will not be computed-17 19:32:21,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1690/17840 [2:51:07<15:10:11, 3.38s/it]g-point operations will not be computed-17 19:32:21,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1691/17840 [2:51:10<13:46:24, 3.07s/it]g-point operations will not be computed-17 19:32:23,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1691/17840 [2:51:10<13:46:24, 3.07s/it]g-point operations will not be computed-17 19:32:23,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1692/17840 [2:51:12<12:22:45, 2.76s/it]g-point operations will not be computed-17 19:32:26,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1692/17840 [2:51:12<12:22:45, 2.76s/it]g-point operations will not be computed-17 19:32:26,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1692/17840 [2:51:12<12:22:45, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:29,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1692/17840 [2:51:12<12:22:45, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:29,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:33,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:29,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1693/17840 [2:51:19<19:13:44, 4.29s/it]g-point operations will not be computed-17 19:32:29,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1693/17840 [2:51:19<19:13:44, 4.29s/it]g-point operations will not be computed-17 19:32:29,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1693/17840 [2:51:19<19:13:44, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1693/17840 [2:51:19<19:13:44, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:41,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1694/17840 [2:51:27<23:47:46, 5.31s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1694/17840 [2:51:27<23:47:46, 5.31s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3323, 'learning_rate': 9.589667458432304e-05, 'epoch': 1.9} + 9%|██████▉ | 1694/17840 [2:51:27<23:47:46, 5.31s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1694/17840 [2:51:27<23:47:46, 5.31s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:51:35<26:54:36, 6.00s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:51:35<26:54:36, 6.00s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1168, 'learning_rate': 9.589073634204276e-05, 'epoch': 1.9} + 10%|██████▉ | 1695/17840 [2:51:35<26:54:36, 6.00s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:58,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:58,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0913, 'learning_rate': 9.588479809976247e-05, 'epoch': 1.9} +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:58,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:32:58,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1697/17840 [2:51:49<30:01:20, 6.70s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1697/17840 [2:51:49<30:01:20, 6.70s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0945, 'learning_rate': 9.587885985748219e-05, 'epoch': 1.9} + 10%|██████▉ | 1697/17840 [2:51:49<30:01:20, 6.70s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1697/17840 [2:51:49<30:01:20, 6.70s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1697/17840 [2:51:49<30:01:20, 6.70s/it]g-point operations will not be computed-17 19:32:37,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:51:57<30:51:25, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:51:57<30:51:25, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:51:57<30:51:25, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1699/17840 [2:52:04<31:19:10, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1699/17840 [2:52:04<31:19:10, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1537, 'learning_rate': 9.586698337292162e-05, 'epoch': 1.9} + 10%|██████▉ | 1699/17840 [2:52:04<31:19:10, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1699/17840 [2:52:04<31:19:10, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:52:14<34:46:28, 7.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:52:14<34:46:28, 7.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2618, 'learning_rate': 9.586104513064134e-05, 'epoch': 1.91} + 10%|██████▉ | 1700/17840 [2:52:14<34:46:28, 7.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:36,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:36,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0846, 'learning_rate': 9.585510688836105e-05, 'epoch': 1.91} +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:36,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:33:36,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:52:28<33:35:42, 7.49s/it]g-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:52:28<33:35:42, 7.49s/it]g-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.271, 'learning_rate': 9.584916864608077e-05, 'epoch': 1.91} + 10%|██████▉ | 1702/17840 [2:52:28<33:35:42, 7.49s/it]g-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:52:28<33:35:42, 7.49s/it]g-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:52:28<33:35:42, 7.49s/it]g-point operations will not be computed-17 19:33:14,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1703/17840 [2:52:35<33:02:02, 7.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:52,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1703/17840 [2:52:35<33:02:02, 7.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:52,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1703/17840 [2:52:35<33:02:02, 7.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:52,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:52:42<32:35:00, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:52,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:52:42<32:35:00, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:52,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2472, 'learning_rate': 9.58372921615202e-05, 'epoch': 1.91} + 10%|██████▉ | 1704/17840 [2:52:42<32:35:00, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:52,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:52:42<32:35:00, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:52,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:52:42<32:35:00, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:33:52,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1705/17840 [2:52:49<32:14:08, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1705/17840 [2:52:49<32:14:08, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1705/17840 [2:52:49<32:14:08, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1706/17840 [2:52:56<31:55:21, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1706/17840 [2:52:56<31:55:21, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9006, 'learning_rate': 9.582541567695963e-05, 'epoch': 1.91} + 10%|██████▉ | 1706/17840 [2:52:56<31:55:21, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:19,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:19,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8795, 'learning_rate': 9.581947743467934e-05, 'epoch': 1.91} +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:19,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:19,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:19,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1708/17840 [2:53:10<31:22:19, 7.00s/it]g-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:29,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:29,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1709/17840 [2:53:17<31:15:32, 6.98s/it]g-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1709/17840 [2:53:17<31:15:32, 6.98s/it]g-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0363, 'learning_rate': 9.580760095011877e-05, 'epoch': 1.92} + 10%|██████▉ | 1709/17840 [2:53:17<31:15:32, 6.98s/it]g-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:39,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:39,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9387, 'learning_rate': 9.580166270783848e-05, 'epoch': 1.92} +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:39,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:39,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:07,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1711/17840 [2:53:31<30:55:22, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1711/17840 [2:53:31<30:55:22, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0323, 'learning_rate': 9.57957244655582e-05, 'epoch': 1.92} + 10%|███████ | 1711/17840 [2:53:31<30:55:22, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1712/17840 [2:53:37<30:36:15, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1712/17840 [2:53:37<30:36:15, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:56,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:56,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:34:56,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:53:44<30:27:28, 6.80s/it]g-point operations will not be computed-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:53:44<30:27:28, 6.80s/it]g-point operations will not be computed-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:53:44<30:27:28, 6.80s/it]g-point operations will not be computed-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:53:44<30:27:28, 6.80s/it]g-point operations will not be computed-17 19:34:48,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8617, 'learning_rate': 9.577790973871734e-05, 'epoch': 1.92} + 10%|███████ | 1714/17840 [2:53:51<30:15:52, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1714/17840 [2:53:51<30:15:52, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1714/17840 [2:53:51<30:15:52, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1714/17840 [2:53:51<30:15:52, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1715/17840 [2:53:57<30:05:26, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:16,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:16,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:16,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1716/17840 [2:54:04<29:56:15, 6.68s/it]g-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1716/17840 [2:54:04<29:56:15, 6.68s/it]g-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:24,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:24,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:54:10<29:50:41, 6.66s/it]g-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:54:10<29:50:41, 6.66s/it]g-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:54:10<29:50:41, 6.66s/it]g-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:54:10<29:50:41, 6.66s/it]g-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:32,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:32,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:32,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:39,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:39,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0946, 'learning_rate': 9.574821852731592e-05, 'epoch': 1.93} +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:39,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:45,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:45,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0806, 'learning_rate': 9.574228028503564e-05, 'epoch': 1.93} +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:45,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:45,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:35:45,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:08,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:54:36<28:58:16, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:54:36<28:58:16, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:54:36<28:58:16, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:54:36<28:58:16, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1722/17840 [2:54:42<28:43:03, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:01,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:01,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:01,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1723/17840 [2:54:49<28:25:21, 6.35s/it]g-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:07,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:07,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:07,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1724/17840 [2:54:55<28:05:53, 6.28s/it]g-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:13,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:13,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:13,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1725/17840 [2:55:03<30:50:28, 6.89s/it]g-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:22,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:22,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:22,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:55:09<29:37:18, 6.62s/it]g-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:27,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:30,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:30,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0116, 'learning_rate': 9.570071258907364e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:30,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:30,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:30,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:35:53,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1728/17840 [2:55:21<27:46:30, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:38,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1728/17840 [2:55:21<27:46:30, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:38,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:42,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:38,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:42,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:38,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2299, 'learning_rate': 9.568883610451307e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:46,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:38,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1730/17840 [2:55:32<26:18:52, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:49,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1730/17840 [2:55:32<26:18:52, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:49,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0102, 'learning_rate': 9.568289786223277e-05, 'epoch': 1.94} + 10%|███████ | 1730/17840 [2:55:32<26:18:52, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:49,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1730/17840 [2:55:32<26:18:52, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:49,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1731/17840 [2:55:37<25:35:46, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:36:54,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:36:57,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1732/17840 [2:55:42<24:53:14, 5.56s/it]g-point operations will not be computed-17 19:36:54,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1732/17840 [2:55:42<24:53:14, 5.56s/it]g-point operations will not be computed-17 19:36:54,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:00,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:03,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:03,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.971, 'learning_rate': 9.566508313539194e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:06,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:36:54,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1734/17840 [2:55:52<23:06:35, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1734/17840 [2:55:52<23:06:35, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9831, 'learning_rate': 9.565914489311164e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:12,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:12,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:14,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:16,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:16,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:18,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:20,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:20,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:23,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:23,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:25,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:26,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:26,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:29,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:29,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:31,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:31,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:33,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:33,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5726, 'learning_rate': 9.561163895486936e-05, 'epoch': 1.95} +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:37,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:37,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:37,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:41,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:41,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:45,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:45,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:45,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:49,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:49,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:49,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:49,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:37:49,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1745/17840 [2:56:41<26:40:14, 5.97s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:00,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:00,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:00,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1746/17840 [2:56:48<28:38:43, 6.41s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1746/17840 [2:56:48<28:38:43, 6.41s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1746/17840 [2:56:48<28:38:43, 6.41s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1746/17840 [2:56:48<28:38:43, 6.41s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1746/17840 [2:56:48<28:38:43, 6.41s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1747/17840 [2:56:55<30:04:42, 6.73s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1747/17840 [2:56:55<30:04:42, 6.73s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1747/17840 [2:56:55<30:04:42, 6.73s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:18,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:18,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9096, 'learning_rate': 9.557600950118766e-05, 'epoch': 1.96} +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:18,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:18,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:18,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:10<31:29:08, 7.04s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:10<31:29:08, 7.04s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:10<31:29:08, 7.04s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:10<31:29:08, 7.04s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1749/17840 [2:57:10<31:29:08, 7.04s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1750/17840 [2:57:20<34:48:31, 7.79s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1750/17840 [2:57:20<34:48:31, 7.79s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1750/17840 [2:57:20<34:48:31, 7.79s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:42,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:42,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0426, 'learning_rate': 9.555819477434679e-05, 'epoch': 1.96} +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:42,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:42,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:42,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1752/17840 [2:57:34<33:13:45, 7.44s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1752/17840 [2:57:34<33:13:45, 7.44s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:38:55,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:57:41<32:39:57, 7.31s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:57:41<32:39:57, 7.31s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.178, 'learning_rate': 9.554631828978623e-05, 'epoch': 1.97} + 10%|███████▏ | 1753/17840 [2:57:41<32:39:57, 7.31s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:57:41<32:39:57, 7.31s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:57:41<32:39:57, 7.31s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1754/17840 [2:57:48<32:14:33, 7.22s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1754/17840 [2:57:48<32:14:33, 7.22s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:09,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:09,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1755/17840 [2:57:55<31:52:10, 7.13s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1755/17840 [2:57:55<31:52:10, 7.13s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1755/17840 [2:57:55<31:52:10, 7.13s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:17,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:17,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0329, 'learning_rate': 9.552850356294537e-05, 'epoch': 1.97} +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:17,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:17,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:17,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1757/17840 [2:58:09<31:28:26, 7.05s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:28,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:28,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1758/17840 [2:58:16<31:13:43, 6.99s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1758/17840 [2:58:16<31:13:43, 6.99s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2081, 'learning_rate': 9.55166270783848e-05, 'epoch': 1.97} + 10%|███████▏ | 1758/17840 [2:58:16<31:13:43, 6.99s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8456, 'learning_rate': 9.551068883610453e-05, 'epoch': 1.97} +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:38,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1760/17840 [2:58:29<30:42:36, 6.88s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:48,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:48,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1761/17840 [2:58:36<30:23:18, 6.80s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1761/17840 [2:58:36<30:23:18, 6.80s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0963, 'learning_rate': 9.549881235154394e-05, 'epoch': 1.97} + 10%|███████▏ | 1761/17840 [2:58:36<30:23:18, 6.80s/it]g-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:58,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:58,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5019, 'learning_rate': 9.549287410926366e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:58,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:58,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:39:58,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:37:09,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1763/17840 [2:58:49<30:00:06, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1763/17840 [2:58:49<30:00:06, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1763/17840 [2:58:49<30:00:06, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1764/17840 [2:58:56<29:49:52, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1764/17840 [2:58:56<29:49:52, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:15,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:15,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1765/17840 [2:59:02<29:39:43, 6.64s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1765/17840 [2:59:02<29:39:43, 6.64s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:21,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:21,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1766/17840 [2:59:09<29:12:29, 6.54s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1766/17840 [2:59:09<29:12:29, 6.54s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1325, 'learning_rate': 9.546912114014253e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:29,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1767/17840 [2:59:15<28:49:50, 6.46s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1767/17840 [2:59:15<28:49:50, 6.46s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.003, 'learning_rate': 9.546318289786224e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:35,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1768/17840 [2:59:21<28:25:33, 6.37s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1768/17840 [2:59:21<28:25:33, 6.37s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3335, 'learning_rate': 9.545724465558196e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:41,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1769/17840 [2:59:27<28:03:26, 6.29s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1769/17840 [2:59:27<28:03:26, 6.29s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.877, 'learning_rate': 9.545130641330166e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:47,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1770/17840 [2:59:33<27:40:35, 6.20s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1770/17840 [2:59:33<27:40:35, 6.20s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9492, 'learning_rate': 9.544536817102139e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:53,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1771/17840 [2:59:39<27:19:46, 6.12s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1771/17840 [2:59:39<27:19:46, 6.12s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:57,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:40:57,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1772/17840 [2:59:45<26:57:18, 6.04s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1772/17840 [2:59:45<26:57:18, 6.04s/it]g-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:03,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:03,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:03,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:40:06,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1773/17840 [2:59:51<26:26:21, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1773/17840 [2:59:51<26:26:21, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:12,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:12,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8841, 'learning_rate': 9.542161520190024e-05, 'epoch': 1.99} +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:15,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1775/17840 [3:00:03<27:55:38, 6.26s/it]g-point operations will not be computed-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1775/17840 [3:00:03<27:55:38, 6.26s/it]g-point operations will not be computed-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:21,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:21,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:21,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:08,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1776/17840 [3:00:08<26:10:30, 5.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:25,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:27,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:25,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:27,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:25,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1777/17840 [3:00:13<24:26:07, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:30,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:32,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:30,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:32,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:30,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1778/17840 [3:00:17<22:43:36, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:34,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:35,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:35,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:34,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1779/17840 [3:00:21<21:00:12, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:37,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:41:37,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:41:37,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1780/17840 [3:00:24<19:19:15, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:41,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1781/17840 [3:00:27<17:39:49, 3.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:44,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1781/17840 [3:00:27<17:39:49, 3.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:44,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1782/17840 [3:00:30<16:00:48, 3.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:46,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1782/17840 [3:00:30<16:00:48, 3.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:46,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:48,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:46,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:48,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:46,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:50,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:49,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:50,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:49,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1784/17840 [3:00:35<12:53:52, 2.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:53,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1784/17840 [3:00:35<12:53:52, 2.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:41:53,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:41:56,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:41:53,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1785/17840 [3:00:43<19:46:34, 4.43s/it]g-point operations will not be computed-17 19:41:53,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1785/17840 [3:00:43<19:46:34, 4.43s/it]g-point operations will not be computed-17 19:41:53,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1785/17840 [3:00:43<19:46:34, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1785/17840 [3:00:43<19:46:34, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:04,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [3:00:50<24:04:16, 5.40s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [3:00:50<24:04:16, 5.40s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6146, 'learning_rate': 9.535035629453683e-05, 'epoch': 2.0} + 10%|███████▎ | 1786/17840 [3:00:50<24:04:16, 5.40s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [3:00:50<24:04:16, 5.40s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1787/17840 [3:00:58<26:52:39, 6.03s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1787/17840 [3:00:58<26:52:39, 6.03s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.851, 'learning_rate': 9.534441805225654e-05, 'epoch': 2.0} +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:19,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:19,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:05<28:43:59, 6.44s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:05<28:43:59, 6.44s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:05<28:43:59, 6.44s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:05<28:43:59, 6.44s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [3:01:05<28:43:59, 6.44s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1789/17840 [3:01:13<29:59:03, 6.73s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1789/17840 [3:01:13<29:59:03, 6.73s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1789/17840 [3:01:13<29:59:03, 6.73s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1789/17840 [3:01:13<29:59:03, 6.73s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1789/17840 [3:01:13<29:59:03, 6.73s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1790/17840 [3:01:20<30:49:25, 6.91s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:39,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:39,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:39,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [3:01:27<31:16:07, 7.01s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [3:01:27<31:16:07, 7.01s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [3:01:27<31:16:07, 7.01s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [3:01:27<31:16:07, 7.01s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [3:01:27<31:16:07, 7.01s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1792/17840 [3:01:34<31:31:55, 7.07s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:54,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:54,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:42:54,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [3:01:42<31:41:43, 7.11s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [3:01:42<31:41:43, 7.11s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [3:01:42<31:41:43, 7.11s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [3:01:42<31:41:43, 7.11s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [3:01:42<31:41:43, 7.11s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1794/17840 [3:01:49<31:49:29, 7.14s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1794/17840 [3:01:49<31:49:29, 7.14s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:10,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1795/17840 [3:01:56<31:45:46, 7.13s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1795/17840 [3:01:56<31:45:46, 7.13s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0702, 'learning_rate': 9.529691211401426e-05, 'epoch': 2.01} + 10%|███████▎ | 1795/17840 [3:01:56<31:45:46, 7.13s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1795/17840 [3:01:56<31:45:46, 7.13s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1795/17840 [3:01:56<31:45:46, 7.13s/it]g-point operations will not be computed-17 19:42:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1796/17840 [3:02:03<31:36:00, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1796/17840 [3:02:03<31:36:00, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1796/17840 [3:02:03<31:36:00, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1796/17840 [3:02:03<31:36:00, 7.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1797/17840 [3:02:10<31:37:12, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1797/17840 [3:02:10<31:37:12, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1797/17840 [3:02:10<31:37:12, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:33,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:33,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5909, 'learning_rate': 9.52790973871734e-05, 'epoch': 2.02} +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:33,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:33,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:33,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1799/17840 [3:02:24<31:21:40, 7.04s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1799/17840 [3:02:24<31:21:40, 7.04s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:43:45,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [3:02:33<34:24:50, 7.72s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [3:02:33<34:24:50, 7.72s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0292, 'learning_rate': 9.526722090261283e-05, 'epoch': 2.02} + 10%|███████▎ | 1800/17840 [3:02:33<34:24:50, 7.72s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [3:02:33<34:24:50, 7.72s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [3:02:33<34:24:50, 7.72s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [3:02:40<33:25:30, 7.50s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [3:02:40<33:25:30, 7.50s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:01,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [3:02:47<32:36:36, 7.32s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [3:02:47<32:36:36, 7.32s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9143, 'learning_rate': 9.525534441805226e-05, 'epoch': 2.02} + 10%|███████▎ | 1802/17840 [3:02:47<32:36:36, 7.32s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [3:02:47<32:36:36, 7.32s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [3:02:47<32:36:36, 7.32s/it]g-point operations will not be computed-17 19:43:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1803/17840 [3:02:54<31:55:05, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1803/17840 [3:02:54<31:55:05, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1803/17840 [3:02:54<31:55:05, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1803/17840 [3:02:54<31:55:05, 7.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1804/17840 [3:03:01<31:23:08, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:20,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:20,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [3:03:08<30:58:43, 6.95s/it]g-point operations will not be computed-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [3:03:08<30:58:43, 6.95s/it]g-point operations will not be computed-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6742, 'learning_rate': 9.523752969121141e-05, 'epoch': 2.02} + 10%|███████▍ | 1805/17840 [3:03:08<30:58:43, 6.95s/it]g-point operations will not be computed-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [3:03:08<30:58:43, 6.95s/it]g-point operations will not be computed-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [3:03:08<30:58:43, 6.95s/it]g-point operations will not be computed-17 19:44:11,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1806/17840 [3:03:14<30:44:15, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1806/17840 [3:03:14<30:44:15, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1806/17840 [3:03:14<30:44:15, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1806/17840 [3:03:14<30:44:15, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1807/17840 [3:03:21<30:30:32, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:40,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:40,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1808/17840 [3:03:28<30:16:23, 6.80s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1808/17840 [3:03:28<30:16:23, 6.80s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2877, 'learning_rate': 9.521971496437056e-05, 'epoch': 2.03} +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:48,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1809/17840 [3:03:34<30:00:27, 6.74s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1809/17840 [3:03:34<30:00:27, 6.74s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8235, 'learning_rate': 9.521377672209026e-05, 'epoch': 2.03} + 10%|███████▍ | 1809/17840 [3:03:34<30:00:27, 6.74s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:56,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:56,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7491, 'learning_rate': 9.520783847980998e-05, 'epoch': 2.03} +[WARNING|modeling_utils.py:388] 2022-03-17 19:44:56,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:03,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:03,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6985, 'learning_rate': 9.520190023752969e-05, 'epoch': 2.03} +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:03,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:03,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1812/17840 [3:03:54<29:16:51, 6.58s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1812/17840 [3:03:54<29:16:51, 6.58s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:13,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:13,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1813/17840 [3:04:00<29:00:36, 6.52s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1813/17840 [3:04:00<29:00:36, 6.52s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1814/17840 [3:04:07<28:40:28, 6.44s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1814/17840 [3:04:07<28:40:28, 6.44s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:25,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:25,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1815/17840 [3:04:13<28:17:51, 6.36s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1815/17840 [3:04:13<28:17:51, 6.36s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1303, 'learning_rate': 9.517814726840856e-05, 'epoch': 2.03} +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:33,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1816/17840 [3:04:19<27:57:01, 6.28s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1816/17840 [3:04:19<27:57:01, 6.28s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:37,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1817/17840 [3:04:25<27:37:41, 6.21s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1817/17840 [3:04:25<27:37:41, 6.21s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:43,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:43,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1818/17840 [3:04:31<27:18:12, 6.13s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1818/17840 [3:04:31<27:18:12, 6.13s/it]g-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:49,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:49,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:49,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:44:32,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1819/17840 [3:04:37<26:54:17, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1819/17840 [3:04:37<26:54:17, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1819/17840 [3:04:37<26:54:17, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:58,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:45:58,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:02,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:02,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1821/17840 [3:04:48<25:47:16, 5.80s/it]g-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:06,443 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:09,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:09,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7599, 'learning_rate': 9.513657957244656e-05, 'epoch': 2.04} +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:12,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:12,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1823/17840 [3:04:58<24:23:22, 5.48s/it]g-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:16,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:19,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:19,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5808, 'learning_rate': 9.512470308788599e-05, 'epoch': 2.04} +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:22,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:22,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:45:54,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1825/17840 [3:05:10<25:38:14, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██��████▍ | 1825/17840 [3:05:10<25:38:14, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1825/17840 [3:05:10<25:38:14, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:30,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:32,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:32,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:34,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:36,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:36,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:38,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:40,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:40,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:43,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:45,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:45,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:46,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:46,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:49,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:49,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:50,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:52,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:52,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:54,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:54,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.2988, 'learning_rate': 9.506532066508314e-05, 'epoch': 2.06} +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:59,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:59,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:46:59,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:02,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:02,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:06,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:06,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:06,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:10,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:10,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:10,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:17,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:17,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6667, 'learning_rate': 9.504750593824228e-05, 'epoch': 2.06} +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:17,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:17,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:17,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [3:06:09<28:15:47, 6.36s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [3:06:09<28:15:47, 6.36s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [3:06:09<28:15:47, 6.36s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [3:06:09<28:15:47, 6.36s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [3:06:09<28:15:47, 6.36s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1839/17840 [3:06:17<29:36:40, 6.66s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1839/17840 [3:06:17<29:36:40, 6.66s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:38,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:06:24<30:22:23, 6.83s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:06:24<30:22:23, 6.83s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6945, 'learning_rate': 9.502969121140143e-05, 'epoch': 2.06} + 10%|███████▌ | 1840/17840 [3:06:24<30:22:23, 6.83s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:06:24<30:22:23, 6.83s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [3:06:24<30:22:23, 6.83s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1841/17840 [3:06:31<30:52:11, 6.95s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|█████���█▌ | 1841/17840 [3:06:31<30:52:11, 6.95s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:47:52,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8651, 'learning_rate': 9.501781472684086e-05, 'epoch': 2.07} + g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [3:06:46<31:33:07, 7.10s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [3:06:46<31:33:07, 7.10s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:06,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1844/17840 [3:06:53<31:29:52, 7.09s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1844/17840 [3:06:53<31:29:52, 7.09s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.591, 'learning_rate': 9.500593824228028e-05, 'epoch': 2.07} + 10%|███████▌ | 1844/17840 [3:06:53<31:29:52, 7.09s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1844/17840 [3:06:53<31:29:52, 7.09s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1844/17840 [3:06:53<31:29:52, 7.09s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1845/17840 [3:07:00<31:23:48, 7.07s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:19,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:19,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1846/17840 [3:07:07<31:22:16, 7.06s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1846/17840 [3:07:07<31:22:16, 7.06s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6679, 'learning_rate': 9.499406175771973e-05, 'epoch': 2.07} + 10%|███████▌ | 1846/17840 [3:07:07<31:22:16, 7.06s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:29,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:29,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9947, 'learning_rate': 9.498812351543943e-05, 'epoch': 2.07} +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:29,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:29,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1848/17840 [3:07:21<31:12:31, 7.03s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1848/17840 [3:07:21<31:12:31, 7.03s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8689, 'learning_rate': 9.498218527315915e-05, 'epoch': 2.07} + 10%|███████▌ | 1848/17840 [3:07:21<31:12:31, 7.03s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:43,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:43,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8943, 'learning_rate': 9.497624703087886e-05, 'epoch': 2.07} +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:43,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:43,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1850/17840 [3:07:37<34:05:44, 7.68s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1850/17840 [3:07:37<34:05:44, 7.68s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7498, 'learning_rate': 9.497030878859858e-05, 'epoch': 2.07} +[WARNING|modeling_utils.py:388] 2022-03-17 19:48:58,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1851/17840 [3:07:44<33:01:54, 7.44s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1851/17840 [3:07:44<33:01:54, 7.44s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9441, 'learning_rate': 9.496437054631829e-05, 'epoch': 2.08} + 10%|███████▌ | 1851/17840 [3:07:44<33:01:54, 7.44s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1851/17840 [3:07:44<33:01:54, 7.44s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1851/17840 [3:07:44<33:01:54, 7.44s/it]g-point operations will not be computed-17 19:46:27,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:07:51<32:10:51, 7.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:07:51<32:10:51, 7.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:07:51<32:10:51, 7.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1853/17840 [3:07:57<31:32:00, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1853/17840 [3:07:57<31:32:00, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9406, 'learning_rate': 9.495249406175773e-05, 'epoch': 2.08} +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:18,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1854/17840 [3:08:04<31:01:20, 6.99s/it]g-point operations will not be computed-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1854/17840 [3:08:04<31:01:20, 6.99s/it]g-point operations will not be computed-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0405, 'learning_rate': 9.494655581947743e-05, 'epoch': 2.08} + 10%|███████▌ | 1854/17840 [3:08:04<31:01:20, 6.99s/it]g-point operations will not be computed-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:26,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:26,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9195, 'learning_rate': 9.494061757719715e-05, 'epoch': 2.08} +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:26,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:26,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:08,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1856/17840 [3:08:17<30:11:51, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1856/17840 [3:08:17<30:11:51, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6935, 'learning_rate': 9.493467933491686e-05, 'epoch': 2.08} + 10%|███████▌ | 1856/17840 [3:08:17<30:11:51, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1857/17840 [3:08:24<29:55:01, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1857/17840 [3:08:24<29:55:01, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:43,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:43,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1858/17840 [3:08:31<29:42:36, 6.69s/it]g-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1858/17840 [3:08:31<29:42:36, 6.69s/it]g-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6979, 'learning_rate': 9.49228028503563e-05, 'epoch': 2.08} +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:51,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:51,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1859/17840 [3:08:37<29:29:25, 6.64s/it]g-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1859/17840 [3:08:37<29:29:25, 6.64s/it]g-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:57,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:49:57,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1860/17840 [3:08:44<29:17:10, 6.60s/it]g-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1860/17840 [3:08:44<29:17:10, 6.60s/it]g-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1860/17840 [3:08:44<29:17:10, 6.60s/it]g-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:05,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:05,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7116, 'learning_rate': 9.490498812351545e-05, 'epoch': 2.09} +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:05,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:12,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:12,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5153, 'learning_rate': 9.489904988123516e-05, 'epoch': 2.09} +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:12,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:12,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:12,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:49:35,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1863/17840 [3:09:03<28:41:39, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:20,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1863/17840 [3:09:03<28:41:39, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:20,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1863/17840 [3:09:03<28:41:39, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:20,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1863/17840 [3:09:03<28:41:39, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:20,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1864/17840 [3:09:09<28:22:55, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1864/17840 [3:09:09<28:22:55, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1864/17840 [3:09:09<28:22:55, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1864/17840 [3:09:09<28:22:55, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1865/17840 [3:09:15<28:12:06, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:34,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:34,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:34,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1866/17840 [3:09:21<27:48:01, 6.27s/it]g-point operations will not be computed-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:40,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:40,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:40,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:26,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:09:27<27:25:21, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:44,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:09:27<27:25:21, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:44,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:09:27<27:25:21, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:44,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:09:27<27:25:21, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:44,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1868/17840 [3:09:33<26:59:58, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1868/17840 [3:09:33<26:59:58, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:54,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:54,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9039, 'learning_rate': 9.485748218527316e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:50:59,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1870/17840 [3:09:45<26:06:42, 5.89s/it]g-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1870/17840 [3:09:45<26:06:42, 5.89s/it]g-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.595, 'learning_rate': 9.485154394299288e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:04,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:04,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1871/17840 [3:09:50<25:44:16, 5.80s/it]g-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:08,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:11,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:11,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5421, 'learning_rate': 9.483966745843232e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:15,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1873/17840 [3:10:01<24:35:55, 5.55s/it]g-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1873/17840 [3:10:01<24:35:55, 5.55s/it]g-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:19,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:21,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:21,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1505, 'learning_rate': 9.482779097387175e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:25,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1875/17840 [3:10:13<26:10:06, 5.90s/it]g-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1875/17840 [3:10:13<26:10:06, 5.90s/it]g-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:31,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:33,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:33,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7305, 'learning_rate': 9.481591448931116e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:37,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:37,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:50:50,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1877/17840 [3:10:22<23:11:13, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:39,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:41,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:39,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:41,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:39,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1878/17840 [3:10:26<21:43:52, 4.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:43,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:45,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:43,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:45,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:43,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1879/17840 [3:10:30<20:20:13, 4.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:47,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1880/17840 [3:10:34<19:01:25, 4.29s/it]g-point operations will not be computed-17 19:51:47,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1880/17840 [3:10:34<19:01:25, 4.29s/it]g-point operations will not be computed-17 19:51:47,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:52,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:50,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1881/17840 [3:10:37<17:32:47, 3.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1881/17840 [3:10:37<17:32:47, 3.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:51:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1882/17840 [3:10:40<16:07:45, 3.64s/it]g-point operations will not be computed-17 19:51:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1882/17840 [3:10:40<16:07:45, 3.64s/it]g-point operations will not be computed-17 19:51:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:57,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:56,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:51:57,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:56,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:00,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:59,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:00,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:51:59,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:10:45<13:16:35, 3.00s/it]g-point operations will not be computed-17 19:51:59,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:10:45<13:16:35, 3.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:02,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:10:45<13:16:35, 3.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:02,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:10:52<19:34:33, 4.42s/it]g-point operations will not be computed-17 19:52:02,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:10:52<19:34:33, 4.42s/it]g-point operations will not be computed-17 19:52:02,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:10:52<19:34:33, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:10:52<19:34:33, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:14,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:11:00<23:46:12, 5.36s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:11:00<23:46:12, 5.36s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8222, 'learning_rate': 9.475653206650832e-05, 'epoch': 2.11} + 11%|███████▋ | 1886/17840 [3:11:00<23:46:12, 5.36s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:11:00<23:46:12, 5.36s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1887/17840 [3:11:07<26:34:20, 6.00s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1887/17840 [3:11:07<26:34:20, 6.00s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9113, 'learning_rate': 9.475059382422803e-05, 'epoch': 2.12} + 11%|███████▋ | 1887/17840 [3:11:07<26:34:20, 6.00s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:30,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:30,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7304, 'learning_rate': 9.474465558194775e-05, 'epoch': 2.12} +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:30,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:30,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1889/17840 [3:11:22<29:25:19, 6.64s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1889/17840 [3:11:22<29:25:19, 6.64s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7148, 'learning_rate': 9.473871733966746e-05, 'epoch': 2.12} + 11%|███████▋ | 1889/17840 [3:11:22<29:25:19, 6.64s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:45,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:45,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6414, 'learning_rate': 9.473277909738718e-05, 'epoch': 2.12} +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:45,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:45,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:11:36<30:48:28, 6.95s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:11:36<30:48:28, 6.95s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7981, 'learning_rate': 9.472684085510688e-05, 'epoch': 2.12} + 11%|███████▋ | 1891/17840 [3:11:36<30:48:28, 6.95s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:59,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:59,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:59,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7365, 'learning_rate': 9.472090261282662e-05, 'epoch': 2.12} +[WARNING|modeling_utils.py:388] 2022-03-17 19:52:59,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1893/17840 [3:11:51<31:10:49, 7.04s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1893/17840 [3:11:51<31:10:49, 7.04s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9714, 'learning_rate': 9.471496437054632e-05, 'epoch': 2.12} + 11%|███████▋ | 1893/17840 [3:11:51<31:10:49, 7.04s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:13,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:13,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.842, 'learning_rate': 9.470902612826605e-05, 'epoch': 2.12} +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:13,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:13,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:13,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1895/17840 [3:12:05<31:06:56, 7.03s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1895/17840 [3:12:05<31:06:56, 7.03s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:25,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:25,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1896/17840 [3:12:12<31:04:03, 7.01s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1896/17840 [3:12:12<31:04:03, 7.01s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1896/17840 [3:12:12<31:04:03, 7.01s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1896/17840 [3:12:12<31:04:03, 7.01s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1896/17840 [3:12:12<31:04:03, 7.01s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1897/17840 [3:12:19<30:55:57, 6.98s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:38,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:12:26<30:50:09, 6.96s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:12:26<30:50:09, 6.96s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:12:26<30:50:09, 6.96s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8398, 'learning_rate': 9.467933491686462e-05, 'epoch': 2.13} +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:53:48,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:12:42<33:52:17, 7.65s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:12:42<33:52:17, 7.65s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:12:42<33:52:17, 7.65s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:04,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:04,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7266, 'learning_rate': 9.466745843230405e-05, 'epoch': 2.13} +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:04,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:04,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:04,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1902/17840 [3:12:55<31:59:42, 7.23s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:14,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:14,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:14,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1903/17840 [3:13:02<31:20:29, 7.08s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1903/17840 [3:13:02<31:20:29, 7.08s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:23,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1904/17840 [3:13:09<30:44:41, 6.95s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1904/17840 [3:13:09<30:44:41, 6.95s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5842, 'learning_rate': 9.464964370546318e-05, 'epoch': 2.13} + 11%|███████▊ | 1904/17840 [3:13:09<30:44:41, 6.95s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:31,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:31,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.908, 'learning_rate': 9.46437054631829e-05, 'epoch': 2.14} +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:31,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:31,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:31,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1906/17840 [3:13:22<30:06:09, 6.80s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:41,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:41,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:41,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1907/17840 [3:13:29<29:41:59, 6.71s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:47,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:47,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1908/17840 [3:13:35<29:22:55, 6.64s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1908/17840 [3:13:35<29:22:55, 6.64s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8471, 'learning_rate': 9.462589073634205e-05, 'epoch': 2.14} + 11%|███████▊ | 1908/17840 [3:13:35<29:22:55, 6.64s/it]g-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:57,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:57,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6454, 'learning_rate': 9.461995249406176e-05, 'epoch': 2.14} +[WARNING|modeling_utils.py:388] 2022-03-17 19:54:57,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:04,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:04,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7157, 'learning_rate': 9.461401425178148e-05, 'epoch': 2.14} +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:04,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:10,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:10,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6247, 'learning_rate': 9.46080760095012e-05, 'epoch': 2.14} +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:10,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:10,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:10,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:52:10,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1912/17840 [3:14:01<28:40:01, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:18,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1912/17840 [3:14:01<28:40:01, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:18,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1912/17840 [3:14:01<28:40:01, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:18,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1912/17840 [3:14:01<28:40:01, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:18,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1913/17840 [3:14:07<28:18:07, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:24,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1913/17840 [3:14:07<28:18:07, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:24,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1913/17840 [3:14:07<28:18:07, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:24,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1913/17840 [3:14:07<28:18:07, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:24,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1914/17840 [3:14:13<27:57:28, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1914/17840 [3:14:13<27:57:28, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:35,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:35,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6152, 'learning_rate': 9.458432304038005e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:35,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:35,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:35,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:30,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1916/17840 [3:14:25<27:09:00, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1916/17840 [3:14:25<27:09:00, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:46,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:46,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.64, 'learning_rate': 9.457244655581948e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:51,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1918/17840 [3:14:37<26:21:22, 5.96s/it]g-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1918/17840 [3:14:37<26:21:22, 5.96s/it]g-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7589, 'learning_rate': 9.45665083135392e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-17 19:55:56,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1919/17840 [3:14:42<25:57:31, 5.87s/it]g-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1919/17840 [3:14:42<25:57:31, 5.87s/it]g-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:01,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:01,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:55:42,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1920/17840 [3:14:48<25:34:09, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1920/17840 [3:14:48<25:34:09, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9507, 'learning_rate': 9.455463182897863e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:09,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:09,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6603, 'learning_rate': 9.454869358669835e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:13,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1922/17840 [3:14:59<24:36:05, 5.56s/it]g-point operations will not be computed-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1922/17840 [3:14:59<24:36:05, 5.56s/it]g-point operations will not be computed-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:17,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:17,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:17,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:05,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1923/17840 [3:15:04<23:57:04, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:23,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1924/17840 [3:15:09<23:16:23, 5.26s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1924/17840 [3:15:09<23:16:23, 5.26s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:27,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:31,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:31,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:33,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:35,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:35,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:37,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:39,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:39,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:41,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:43,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:43,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:45,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:46,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:46,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:50,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:50,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:51,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:52,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:52,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:55,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:55,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:57,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:57,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:59,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:56:59,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4785, 'learning_rate': 9.447149643705464e-05, 'epoch': 2.17} +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:03,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:03,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:07,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:07,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9672, 'learning_rate': 9.446555819477435e-05, 'epoch': 2.17} +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:11,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:11,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:15,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:15,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8329, 'learning_rate': 9.445961995249407e-05, 'epoch': 2.17} +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:15,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:15,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1937/17840 [3:16:07<26:17:12, 5.95s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1937/17840 [3:16:07<26:17:12, 5.95s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6175, 'learning_rate': 9.445368171021378e-05, 'epoch': 2.17} + 11%|███████▉ | 1937/17840 [3:16:07<26:17:12, 5.95s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:30,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:30,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8628, 'learning_rate': 9.44477434679335e-05, 'epoch': 2.17} +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:30,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:30,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:30,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:16:22<29:42:55, 6.73s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:16:22<29:42:55, 6.73s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:16:22<29:42:55, 6.73s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:16:22<29:42:55, 6.73s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:16:22<29:42:55, 6.73s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1940/17840 [3:16:29<30:29:02, 6.90s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:48,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:48,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:57:48,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:16:37<31:02:26, 7.03s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:16:37<31:02:26, 7.03s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:16:37<31:02:26, 7.03s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:16:37<31:02:26, 7.03s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:16:37<31:02:26, 7.03s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:16:44<31:16:38, 7.08s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:16:44<31:16:38, 7.08s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:16:44<31:16:38, 7.08s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:16:44<31:16:38, 7.08s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:16:44<31:16:38, 7.08s/it]g-point operations will not be computed-17 19:56:21,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1943/17840 [3:16:51<31:23:08, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1943/17840 [3:16:51<31:23:08, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1943/17840 [3:16:51<31:23:08, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1943/17840 [3:16:51<31:23:08, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1944/17840 [3:16:58<31:25:23, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1944/17840 [3:16:58<31:25:23, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1944/17840 [3:16:58<31:25:23, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:21,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:21,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9108, 'learning_rate': 9.440617577197151e-05, 'epoch': 2.18} +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:21,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:21,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:21,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:17:12<31:15:57, 7.08s/it]g-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:17:12<31:15:57, 7.08s/it]g-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:58:33,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1947/17840 [3:17:19<31:13:10, 7.07s/it]g-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1947/17840 [3:17:19<31:13:10, 7.07s/it]g-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5667, 'learning_rate': 9.439429928741093e-05, 'epoch': 2.18} + 11%|███████▉ | 1947/17840 [3:17:19<31:13:10, 7.07s/it]g-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1947/17840 [3:17:19<31:13:10, 7.07s/it]g-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1947/17840 [3:17:19<31:13:10, 7.07s/it]g-point operations will not be computed-17 19:58:08,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:17:26<30:59:30, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:17:26<30:59:30, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:17:26<30:59:30, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:17:26<30:59:30, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1949/17840 [3:17:33<30:55:52, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1949/17840 [3:17:33<30:55:52, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1949/17840 [3:17:33<30:55:52, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1949/17840 [3:17:33<30:55:52, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1949/17840 [3:17:33<30:55:52, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1950/17840 [3:17:42<33:54:31, 7.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:01,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:01,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:01,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1951/17840 [3:17:49<32:49:10, 7.44s/it]g-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1951/17840 [3:17:49<32:49:10, 7.44s/it]g-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:10,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1952/17840 [3:17:56<32:05:35, 7.27s/it]g-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1952/17840 [3:17:56<32:05:35, 7.27s/it]g-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4937, 'learning_rate': 9.436460807600951e-05, 'epoch': 2.19} + 11%|███████▉ | 1952/17840 [3:17:56<32:05:35, 7.27s/it]g-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1952/17840 [3:17:56<32:05:35, 7.27s/it]g-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1952/17840 [3:17:56<32:05:35, 7.27s/it]g-point operations will not be computed-17 19:58:43,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1953/17840 [3:18:03<31:26:46, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1953/17840 [3:18:03<31:26:46, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1953/17840 [3:18:03<31:26:46, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1954/17840 [3:18:10<30:59:15, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1954/17840 [3:18:10<30:59:15, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:29,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:29,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1955/17840 [3:18:16<30:28:41, 6.91s/it]g-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1955/17840 [3:18:16<30:28:41, 6.91s/it]g-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6357, 'learning_rate': 9.434679334916865e-05, 'epoch': 2.19} + 11%|███████▉ | 1955/17840 [3:18:16<30:28:41, 6.91s/it]g-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:38,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:38,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6001, 'learning_rate': 9.434085510688837e-05, 'epoch': 2.19} +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:38,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:38,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:38,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:20,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1957/17840 [3:18:29<29:41:38, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1957/17840 [3:18:29<29:41:38, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1957/17840 [3:18:29<29:41:38, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1957/17840 [3:18:29<29:41:38, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1958/17840 [3:18:36<29:27:29, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:55,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 19:59:55,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1959/17840 [3:18:42<29:10:38, 6.61s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1959/17840 [3:18:42<29:10:38, 6.61s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:01,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:01,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1960/17840 [3:18:49<28:55:07, 6.56s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1960/17840 [3:18:49<28:55:07, 6.56s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8528, 'learning_rate': 9.431710213776722e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:09,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1961/17840 [3:18:55<28:47:46, 6.53s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1961/17840 [3:18:55<28:47:46, 6.53s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4413, 'learning_rate': 9.431116389548694e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:16,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1962/17840 [3:19:02<28:33:44, 6.48s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1962/17840 [3:19:02<28:33:44, 6.48s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8169, 'learning_rate': 9.430522565320665e-05, 'epoch': 2.2} + 11%|████████ | 1962/17840 [3:19:02<28:33:44, 6.48s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:23,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:23,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6864, 'learning_rate': 9.429928741092637e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:23,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:30,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:30,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.69, 'learning_rate': 9.429334916864608e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:30,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:36,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:36,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6674, 'learning_rate': 9.428741092636581e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:36,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:42,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:42,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4813, 'learning_rate': 9.428147268408552e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:42,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:48,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:48,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5167, 'learning_rate': 9.427553444180524e-05, 'epoch': 2.21} +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:52,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:52,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1968/17840 [3:19:38<26:49:25, 6.08s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1968/17840 [3:19:38<26:49:25, 6.08s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:58,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:00:58,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1969/17840 [3:19:44<26:23:34, 5.99s/it]g-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:02,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:02,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:02,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 19:59:47,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1970/17840 [3:19:50<25:57:13, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1970/17840 [3:19:50<25:57:13, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:11,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:11,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.65, 'learning_rate': 9.425178147268409e-05, 'epoch': 2.21} +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:15,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:15,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1972/17840 [3:20:01<25:09:59, 5.71s/it]g-point operations will not be computed-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:19,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:19,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:19,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:07,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1973/17840 [3:20:06<24:29:54, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:23,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1973/17840 [3:20:06<24:29:54, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:23,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1973/17840 [3:20:06<24:29:54, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:23,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:27,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:23,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:29,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:23,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:29,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:23,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:29,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:23,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1975/17840 [3:20:18<25:49:55, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:35,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:37,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:35,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:37,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:35,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1976/17840 [3:20:23<24:06:37, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:39,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:41,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:39,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:41,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:39,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1977/17840 [3:20:27<22:29:10, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:43,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:45,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:43,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:45,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:43,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1978/17840 [3:20:31<21:00:48, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:47,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:49,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:47,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:49,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:47,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1979/17840 [3:20:34<19:27:25, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:51,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:52,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:51,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:01:52,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:01:51,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1980/17840 [3:20:38<17:54:39, 4.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:54,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1980/17840 [3:20:38<17:54:39, 4.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:54,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1981/17840 [3:20:41<16:29:23, 3.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:57,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1981/17840 [3:20:41<16:29:23, 3.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:01:57,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1982/17840 [3:20:43<14:59:05, 3.40s/it]g-point operations will not be computed-17 20:01:57,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1982/17840 [3:20:43<14:59:05, 3.40s/it]g-point operations will not be computed-17 20:01:57,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1983/17840 [3:20:45<13:31:47, 3.07s/it]g-point operations will not be computed-17 20:01:59,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1984/17840 [3:20:48<12:10:25, 2.76s/it]g-point operations will not be computed-17 20:02:02,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1984/17840 [3:20:48<12:10:25, 2.76s/it]g-point operations will not be computed-17 20:02:02,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1984/17840 [3:20:48<12:10:25, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:02:05,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1984/17840 [3:20:48<12:10:25, 2.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:02:05,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:09,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:05,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:09,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:05,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1985/17840 [3:20:55<18:48:38, 4.27s/it]g-point operations will not be computed-17 20:02:05,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1985/17840 [3:20:55<18:48:38, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1985/17840 [3:20:55<18:48:38, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:17,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:17,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1986/17840 [3:21:03<23:14:41, 5.28s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1986/17840 [3:21:03<23:14:41, 5.28s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1986/17840 [3:21:03<23:14:41, 5.28s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1986/17840 [3:21:03<23:14:41, 5.28s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1987/17840 [3:21:10<26:10:58, 5.95s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1987/17840 [3:21:10<26:10:58, 5.95s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:30,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:30,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:21:18<27:59:30, 6.36s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:21:18<27:59:30, 6.36s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8886, 'learning_rate': 9.415083135391924e-05, 'epoch': 2.23} + 11%|████████▏ | 1988/17840 [3:21:18<27:59:30, 6.36s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:21:18<27:59:30, 6.36s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1989/17840 [3:21:25<29:09:37, 6.62s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1989/17840 [3:21:25<29:09:37, 6.62s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.715, 'learning_rate': 9.414489311163895e-05, 'epoch': 2.23} + 11%|████████▏ | 1989/17840 [3:21:25<29:09:37, 6.62s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:48,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:48,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7238, 'learning_rate': 9.413895486935867e-05, 'epoch': 2.23} +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:48,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:48,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:02:48,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1991/17840 [3:21:40<30:31:45, 6.93s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1991/17840 [3:21:40<30:31:45, 6.93s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:00,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1992/17840 [3:21:47<30:56:08, 7.03s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1992/17840 [3:21:47<30:56:08, 7.03s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9504, 'learning_rate': 9.412707838479811e-05, 'epoch': 2.23} + 11%|████████▏ | 1992/17840 [3:21:47<30:56:08, 7.03s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1992/17840 [3:21:47<30:56:08, 7.03s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1992/17840 [3:21:47<30:56:08, 7.03s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1993/17840 [3:21:54<31:01:53, 7.05s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1993/17840 [3:21:54<31:01:53, 7.05s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:15,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:22:01<31:10:01, 7.08s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:22:01<31:10:01, 7.08s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.666, 'learning_rate': 9.411520190023754e-05, 'epoch': 2.24} + 11%|████████▏ | 1994/17840 [3:22:01<31:10:01, 7.08s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:22:01<31:10:01, 7.08s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:22:01<31:10:01, 7.08s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1995/17840 [3:22:08<31:11:28, 7.09s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1995/17840 [3:22:08<31:11:28, 7.09s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:29,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1996/17840 [3:22:15<31:00:50, 7.05s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1996/17840 [3:22:15<31:00:50, 7.05s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7099, 'learning_rate': 9.410332541567697e-05, 'epoch': 2.24} + 11%|████████▏ | 1996/17840 [3:22:15<31:00:50, 7.05s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1996/17840 [3:22:15<31:00:50, 7.05s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1996/17840 [3:22:15<31:00:50, 7.05s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1997/17840 [3:22:22<31:04:55, 7.06s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:41,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:41,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:03:41,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1998/17840 [3:22:29<30:54:03, 7.02s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1998/17840 [3:22:29<30:54:03, 7.02s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1998/17840 [3:22:29<30:54:03, 7.02s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1998/17840 [3:22:29<30:54:03, 7.02s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1998/17840 [3:22:29<30:54:03, 7.02s/it]g-point operations will not be computed-17 20:02:13,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1999/17840 [3:22:36<30:39:30, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1999/17840 [3:22:36<30:39:30, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1999/17840 [3:22:36<30:39:30, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1999/17840 [3:22:36<30:39:30, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:22:45<33:37:03, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:22:45<33:37:03, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:22:45<33:37:03, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:07,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:07,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7284, 'learning_rate': 9.407363420427554e-05, 'epoch': 2.24} +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:07,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:07,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:07,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:03:53,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2002/17840 [3:22:59<31:42:20, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2002/17840 [3:22:59<31:42:20, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2002/17840 [3:22:59<31:42:20, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2002/17840 [3:22:59<31:42:20, 7.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2003/17840 [3:23:05<31:00:33, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:24,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:24,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2004/17840 [3:23:12<30:39:54, 6.97s/it]g-point operations will not be computed-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2004/17840 [3:23:12<30:39:54, 6.97s/it]g-point operations will not be computed-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7331, 'learning_rate': 9.405581947743467e-05, 'epoch': 2.25} + 11%|████████▏ | 2004/17840 [3:23:12<30:39:54, 6.97s/it]g-point operations will not be computed-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2004/17840 [3:23:12<30:39:54, 6.97s/it]g-point operations will not be computed-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2004/17840 [3:23:12<30:39:54, 6.97s/it]g-point operations will not be computed-17 20:04:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2005/17840 [3:23:19<30:16:41, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2005/17840 [3:23:19<30:16:41, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2005/17840 [3:23:19<30:16:41, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2005/17840 [3:23:19<30:16:41, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2006/17840 [3:23:26<30:01:33, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2006/17840 [3:23:26<30:01:33, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:46,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:46,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2007/17840 [3:23:32<29:39:19, 6.74s/it]g-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2007/17840 [3:23:32<29:39:19, 6.74s/it]g-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:04:52,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2008/17840 [3:23:39<29:15:22, 6.65s/it]g-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2008/17840 [3:23:39<29:15:22, 6.65s/it]g-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9321, 'learning_rate': 9.403206650831354e-05, 'epoch': 2.25} + 11%|████████▏ | 2008/17840 [3:23:39<29:15:22, 6.65s/it]g-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:01,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:01,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8822, 'learning_rate': 9.402612826603325e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:01,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:07,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:07,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.952, 'learning_rate': 9.402019002375297e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:07,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:07,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:07,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:04:36,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2011/17840 [3:23:58<28:47:06, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:15,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2011/17840 [3:23:58<28:47:06, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:15,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2011/17840 [3:23:58<28:47:06, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:15,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2012/17840 [3:24:04<28:31:10, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2012/17840 [3:24:04<28:31:10, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7495, 'learning_rate': 9.400831353919241e-05, 'epoch': 2.26} + 11%|████████▏ | 2012/17840 [3:24:04<28:31:10, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2013/17840 [3:24:11<28:20:19, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2013/17840 [3:24:11<28:20:19, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:29,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:29,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2014/17840 [3:24:17<28:06:57, 6.40s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2014/17840 [3:24:17<28:06:57, 6.40s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:36,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:36,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2015/17840 [3:24:23<27:53:36, 6.35s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2015/17840 [3:24:23<27:53:36, 6.35s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:42,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:42,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2016/17840 [3:24:29<27:36:44, 6.28s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2016/17840 [3:24:29<27:36:44, 6.28s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:48,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:48,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2017/17840 [3:24:36<27:22:06, 6.23s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2017/17840 [3:24:36<27:22:06, 6.23s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:05:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2018/17840 [3:24:41<26:58:12, 6.14s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2018/17840 [3:24:41<26:58:12, 6.14s/it]g-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:00,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:00,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:00,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:05:22,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2019/17840 [3:24:47<26:26:53, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2019/17840 [3:24:47<26:26:53, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:08,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:08,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7199, 'learning_rate': 9.396080760095012e-05, 'epoch': 2.26} +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:13,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2021/17840 [3:24:58<25:35:28, 5.82s/it]g-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2021/17840 [3:24:58<25:35:28, 5.82s/it]g-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7737, 'learning_rate': 9.395486935866984e-05, 'epoch': 2.27} +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:18,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2022/17840 [3:25:04<24:57:18, 5.68s/it]g-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2022/17840 [3:25:04<24:57:18, 5.68s/it]g-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:22,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:24,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:24,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8498, 'learning_rate': 9.394299287410927e-05, 'epoch': 2.27} +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:28,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:04,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2024/17840 [3:25:14<23:31:14, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2024/17840 [3:25:14<23:31:14, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8125, 'learning_rate': 9.393705463182899e-05, 'epoch': 2.27} + 11%|████████▎ | 2024/17840 [3:25:14<23:31:14, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2025/17840 [3:25:21<25:06:24, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2025/17840 [3:25:21<25:06:24, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:38,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:41,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:41,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:43,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:45,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:45,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:49,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:49,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:50,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:52,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:52,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:54,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:57,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:57,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:58,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:06:58,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:01,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:01,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:03,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:03,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:05,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:05,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:05,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:09,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:09,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:09,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:13,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:13,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:17,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:17,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:17,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:21,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:21,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:21,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:21,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:21,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:26:13<26:22:29, 6.01s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:26:13<26:22:29, 6.01s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:26:13<26:22:29, 6.01s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:26:13<26:22:29, 6.01s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:26:13<26:22:29, 6.01s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:26:21<28:20:02, 6.46s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:40,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:40,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:40,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:26:28<29:36:05, 6.74s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:26:28<29:36:05, 6.74s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:26:28<29:36:05, 6.74s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:26:28<29:36:05, 6.74s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:26:28<29:36:05, 6.74s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2040/17840 [3:26:35<30:25:56, 6.93s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2040/17840 [3:26:35<30:25:56, 6.93s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2040/17840 [3:26:35<30:25:56, 6.93s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:58,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:58,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5708, 'learning_rate': 9.383610451306414e-05, 'epoch': 2.29} +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:58,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:58,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:07:58,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:26:50<31:18:00, 7.13s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:26:50<31:18:00, 7.13s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:26:50<31:18:00, 7.13s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:26:50<31:18:00, 7.13s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:26:50<31:18:00, 7.13s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:26:57<31:27:31, 7.17s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:16,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:16,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:16,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:27:05<31:33:35, 7.19s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:27:05<31:33:35, 7.19s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:27:05<31:33:35, 7.19s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:27:05<31:33:35, 7.19s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:27:05<31:33:35, 7.19s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2045/17840 [3:27:12<31:39:06, 7.21s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2045/17840 [3:27:12<31:39:06, 7.21s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:33,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:33,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2046/17840 [3:27:19<31:24:50, 7.16s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2046/17840 [3:27:19<31:24:50, 7.16s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2046/17840 [3:27:19<31:24:50, 7.16s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2046/17840 [3:27:19<31:24:50, 7.16s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2046/17840 [3:27:19<31:24:50, 7.16s/it]g-point operations will not be computed-17 20:06:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2047/17840 [3:27:26<31:10:13, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:47,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:47,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2048/17840 [3:27:33<31:04:53, 7.09s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2048/17840 [3:27:33<31:04:53, 7.09s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2048/17840 [3:27:33<31:04:53, 7.09s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2048/17840 [3:27:33<31:04:53, 7.09s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2048/17840 [3:27:33<31:04:53, 7.09s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2049/17840 [3:27:40<31:02:34, 7.08s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:08:59,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2050/17840 [3:27:49<33:50:07, 7.71s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2050/17840 [3:27:49<33:50:07, 7.71s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2050/17840 [3:27:49<33:50:07, 7.71s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:11,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:11,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7318, 'learning_rate': 9.377672209026129e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:11,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:11,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:11,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2052/17840 [3:28:03<31:49:38, 7.26s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2052/17840 [3:28:03<31:49:38, 7.26s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:23,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2053/17840 [3:28:10<31:15:11, 7.13s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2053/17840 [3:28:10<31:15:11, 7.13s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7634, 'learning_rate': 9.376484560570071e-05, 'epoch': 2.3} + 12%|████████▍ | 2053/17840 [3:28:10<31:15:11, 7.13s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:32,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:32,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6269, 'learning_rate': 9.375890736342043e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:32,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:32,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:32,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2055/17840 [3:28:23<30:30:56, 6.96s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:42,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:42,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2056/17840 [3:28:30<30:07:00, 6.87s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2056/17840 [3:28:30<30:07:00, 6.87s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6545, 'learning_rate': 9.374703087885986e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:50,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2057/17840 [3:28:36<29:49:23, 6.80s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2057/17840 [3:28:36<29:49:23, 6.80s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.635, 'learning_rate': 9.374109263657957e-05, 'epoch': 2.31} + 12%|████████▍ | 2057/17840 [3:28:36<29:49:23, 6.80s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:58,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:58,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.529, 'learning_rate': 9.373515439429929e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:58,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:58,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:09:58,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2059/17840 [3:28:50<29:14:53, 6.67s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:08,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:08,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2060/17840 [3:28:56<28:55:42, 6.60s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2060/17840 [3:28:56<28:55:42, 6.60s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7355, 'learning_rate': 9.372327790973873e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:16,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2061/17840 [3:29:03<28:50:02, 6.58s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2061/17840 [3:29:03<28:50:02, 6.58s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8496, 'learning_rate': 9.371733966745844e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-17 20:10:23,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2062/17840 [3:29:09<28:38:17, 6.53s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2062/17840 [3:29:09<28:38:17, 6.53s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8205, 'learning_rate': 9.371140142517814e-05, 'epoch': 2.31} + 12%|████████▍ | 2062/17840 [3:29:09<28:38:17, 6.53s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2062/17840 [3:29:09<28:38:17, 6.53s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2062/17840 [3:29:09<28:38:17, 6.53s/it]g-point operations will not be computed-17 20:08:43,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2063/17840 [3:29:15<28:29:00, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:33,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2063/17840 [3:29:15<28:29:00, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:33,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2063/17840 [3:29:15<28:29:00, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:33,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2063/17840 [3:29:15<28:29:00, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:33,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2064/17840 [3:29:22<28:09:42, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:39,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2064/17840 [3:29:22<28:09:42, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:39,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2064/17840 [3:29:22<28:09:42, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:39,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2064/17840 [3:29:22<28:09:42, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:39,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:29:28<27:57:52, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:45,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:29:28<27:57:52, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:45,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:29:28<27:57:52, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:45,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:29:28<27:57:52, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:45,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2066/17840 [3:29:34<27:38:36, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:51,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2066/17840 [3:29:34<27:38:36, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:51,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2066/17840 [3:29:34<27:38:36, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:51,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2066/17840 [3:29:34<27:38:36, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:51,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2067/17840 [3:29:40<27:27:13, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:57,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2067/17840 [3:29:40<27:27:13, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:57,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2067/17840 [3:29:40<27:27:13, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:57,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2067/17840 [3:29:40<27:27:13, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:10:57,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2068/17840 [3:29:46<26:57:38, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2068/17840 [3:29:46<26:57:38, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:07,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:07,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6845, 'learning_rate': 9.366983372921616e-05, 'epoch': 2.32} +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:07,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:13,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:13,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5578, 'learning_rate': 9.366389548693587e-05, 'epoch': 2.32} +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:17,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2071/17840 [3:30:03<25:43:57, 5.87s/it]g-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2071/17840 [3:30:03<25:43:57, 5.87s/it]g-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:22,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:22,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:22,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2072/17840 [3:30:09<25:13:22, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:26,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2072/17840 [3:30:09<25:13:22, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:26,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:30,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:26,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:30,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:26,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:32,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:26,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:32,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:26,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2074/17840 [3:30:19<23:52:59, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2074/17840 [3:30:19<23:52:59, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:38,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2075/17840 [3:30:26<25:56:54, 5.93s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2075/17840 [3:30:26<25:56:54, 5.93s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:44,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:46,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:46,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:48,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:51,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:51,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:53,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:55,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:55,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:56,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:56,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:11:58,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:00,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:00,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:03,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:03,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:04,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:04,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:07,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:08,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:08,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:10,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:10,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:11,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:11,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:15,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:15,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:15,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:19,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:19,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:23,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:23,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:19<26:02:31, 5.95s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:19<26:02:31, 5.95s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:19<26:02:31, 5.95s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:19<26:02:31, 5.95s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:31:19<26:02:31, 5.95s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2088/17840 [3:31:26<27:57:15, 6.39s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:45,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:45,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:12:45,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2089/17840 [3:31:34<29:13:09, 6.68s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2089/17840 [3:31:34<29:13:09, 6.68s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2089/17840 [3:31:34<29:13:09, 6.68s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2089/17840 [3:31:34<29:13:09, 6.68s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2089/17840 [3:31:34<29:13:09, 6.68s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2090/17840 [3:31:41<30:04:44, 6.88s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2090/17840 [3:31:41<30:04:44, 6.88s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2090/17840 [3:31:41<30:04:44, 6.88s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:04,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:04,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6725, 'learning_rate': 9.353919239904988e-05, 'epoch': 2.34} +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:04,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:04,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:04,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2092/17840 [3:31:55<30:53:58, 7.06s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2092/17840 [3:31:55<30:53:58, 7.06s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2092/17840 [3:31:55<30:53:58, 7.06s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:18,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:18,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0596, 'learning_rate': 9.352731591448931e-05, 'epoch': 2.35} +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:18,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:18,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:18,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:32:10<31:09:39, 7.12s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:32:10<31:09:39, 7.12s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:32:10<31:09:39, 7.12s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:32,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:32,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8553, 'learning_rate': 9.351543942992874e-05, 'epoch': 2.35} +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:32,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:32,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:32,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2096/17840 [3:32:24<30:52:32, 7.06s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2096/17840 [3:32:24<30:52:32, 7.06s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:13:45,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:32:31<30:49:36, 7.05s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:32:31<30:49:36, 7.05s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1884, 'learning_rate': 9.350356294536817e-05, 'epoch': 2.35} + 12%|████████▌ | 2097/17840 [3:32:31<30:49:36, 7.05s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:32:31<30:49:36, 7.05s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:32:31<30:49:36, 7.05s/it]g-point operations will not be computed-17 20:11:36,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:32:38<30:37:59, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:32:38<30:37:59, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:32:38<30:37:59, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:32:38<30:37:59, 7.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:32:44<30:21:52, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:32:44<30:21:52, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:32:44<30:21:52, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:32:44<30:21:52, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:32:54<33:23:48, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:32:54<33:23:48, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.718, 'learning_rate': 9.348574821852733e-05, 'epoch': 2.35} + 12%|████████▌ | 2100/17840 [3:32:54<33:23:48, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:32:54<33:23:48, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:32:54<33:23:48, 7.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2101/17840 [3:33:01<32:28:00, 7.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2101/17840 [3:33:01<32:28:00, 7.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:21,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2102/17840 [3:33:07<31:34:46, 7.22s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2102/17840 [3:33:07<31:34:46, 7.22s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8097, 'learning_rate': 9.347387173396675e-05, 'epoch': 2.36} + 12%|████████▌ | 2102/17840 [3:33:07<31:34:46, 7.22s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.762, 'learning_rate': 9.346793349168646e-05, 'epoch': 2.36} +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:30,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2104/17840 [3:33:21<30:20:55, 6.94s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:40,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:40,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:40,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2105/17840 [3:33:27<29:56:03, 6.85s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2105/17840 [3:33:27<29:56:03, 6.85s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:48,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2106/17840 [3:33:34<29:35:42, 6.77s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2106/17840 [3:33:34<29:35:42, 6.77s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7981, 'learning_rate': 9.345011876484561e-05, 'epoch': 2.36} + 12%|████████▌ | 2106/17840 [3:33:34<29:35:42, 6.77s/it]g-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:56,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:56,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5818, 'learning_rate': 9.344418052256533e-05, 'epoch': 2.36} +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:56,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:56,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:14:56,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:13:55,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2108/17840 [3:33:47<29:06:50, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2108/17840 [3:33:47<29:06:50, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2108/17840 [3:33:47<29:06:50, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2108/17840 [3:33:47<29:06:50, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2109/17840 [3:33:54<28:50:27, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:12,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:12,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2110/17840 [3:34:00<28:38:20, 6.55s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2110/17840 [3:34:00<28:38:20, 6.55s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7066, 'learning_rate': 9.342636579572446e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:20,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2111/17840 [3:34:06<28:25:39, 6.51s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2111/17840 [3:34:06<28:25:39, 6.51s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7437, 'learning_rate': 9.342042755344418e-05, 'epoch': 2.37} + 12%|████████▋ | 2111/17840 [3:34:06<28:25:39, 6.51s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:28,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:28,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6526, 'learning_rate': 9.34144893111639e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:28,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:35,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:35,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6724, 'learning_rate': 9.340855106888361e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:35,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:41,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:41,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7284, 'learning_rate': 9.340261282660333e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:41,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:47,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:47,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6593, 'learning_rate': 9.339667458432304e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:47,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:53,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:53,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6881, 'learning_rate': 9.339073634204276e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:53,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:59,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:15:59,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4743, 'learning_rate': 9.338479809976247e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:04,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2118/17840 [3:34:50<26:39:37, 6.10s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2118/17840 [3:34:50<26:39:37, 6.10s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5646, 'learning_rate': 9.33788598574822e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:09,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2119/17840 [3:34:55<26:20:36, 6.03s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2119/17840 [3:34:55<26:20:36, 6.03s/it]g-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:14,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:14,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:15:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2120/17840 [3:35:01<25:52:05, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2120/17840 [3:35:01<25:52:05, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8123, 'learning_rate': 9.336698337292163e-05, 'epoch': 2.38} +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:22,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:22,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:22,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:26,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2122/17840 [3:35:12<24:55:51, 5.71s/it]g-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2122/17840 [3:35:12<24:55:51, 5.71s/it]g-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:30,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:30,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2123/17840 [3:35:17<24:24:26, 5.59s/it]g-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2123/17840 [3:35:17<24:24:26, 5.59s/it]g-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:35,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:35,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:38,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:38,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:42,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:42,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:18,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2125/17840 [3:35:29<25:36:14, 5.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:46,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:48,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:46,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:48,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:46,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2126/17840 [3:35:34<23:53:24, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:51,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:53,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:51,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:53,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:51,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2127/17840 [3:35:38<22:14:12, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:55,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:57,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:55,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:16:57,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:55,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2128/17840 [3:35:42<20:42:06, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:16:59,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:00,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:16:59,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2129/17840 [3:35:46<19:10:23, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:02,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2129/17840 [3:35:46<19:10:23, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:02,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2130/17840 [3:35:49<17:38:21, 4.04s/it]g-point operations will not be computed-17 20:17:02,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2130/17840 [3:35:49<17:38:21, 4.04s/it]g-point operations will not be computed-17 20:17:02,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:06,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:05,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2131/17840 [3:35:52<16:05:06, 3.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:08,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2131/17840 [3:35:52<16:05:06, 3.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:08,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|██████��█▋ | 2132/17840 [3:35:54<14:38:54, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:10,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2132/17840 [3:35:54<14:38:54, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:10,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6128, 'learning_rate': 9.32957244655582e-05, 'epoch': 2.39} + 12%|████████▋ | 2133/17840 [3:35:57<13:18:54, 3.05s/it]g-point operations will not be computed-17 20:17:10,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2133/17840 [3:35:57<13:18:54, 3.05s/it]g-point operations will not be computed-17 20:17:10,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2134/17840 [3:35:59<12:04:36, 2.77s/it]g-point operations will not be computed-17 20:17:13,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2134/17840 [3:35:59<12:04:36, 2.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:16,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2134/17840 [3:35:59<12:04:36, 2.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:16,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:20,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:16,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:20,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:16,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2135/17840 [3:36:07<18:48:40, 4.31s/it]g-point operations will not be computed-17 20:17:16,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2135/17840 [3:36:07<18:48:40, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2135/17840 [3:36:07<18:48:40, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:28,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:28,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2136/17840 [3:36:14<23:05:16, 5.29s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2136/17840 [3:36:14<23:05:16, 5.29s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2136/17840 [3:36:14<23:05:16, 5.29s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2136/17840 [3:36:14<23:05:16, 5.29s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2136/17840 [3:36:14<23:05:16, 5.29s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2137/17840 [3:36:22<26:05:00, 5.98s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2137/17840 [3:36:22<26:05:00, 5.98s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:43,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:43,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:36:29<27:56:35, 6.41s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:36:29<27:56:35, 6.41s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:36:29<27:56:35, 6.41s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:36:29<27:56:35, 6.41s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2138/17840 [3:36:29<27:56:35, 6.41s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:36:37<29:11:22, 6.69s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:36:37<29:11:22, 6.69s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:36:37<29:11:22, 6.69s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:36:37<29:11:22, 6.69s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:59,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:59,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:59,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:59,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:17:59,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:36:51<30:26:33, 6.98s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:36:51<30:26:33, 6.98s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:36:51<30:26:33, 6.98s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:36:51<30:26:33, 6.98s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:36:51<30:26:33, 6.98s/it]g-point operations will not be computed-17 20:17:24,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2142/17840 [3:36:58<30:41:38, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2142/17840 [3:36:58<30:41:38, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2142/17840 [3:36:58<30:41:38, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2142/17840 [3:36:58<30:41:38, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2143/17840 [3:37:05<30:52:32, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2143/17840 [3:37:05<30:52:32, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2143/17840 [3:37:05<30:52:32, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:28,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:28,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8017, 'learning_rate': 9.322446555819478e-05, 'epoch': 2.4} +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:28,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:28,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:28,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2145/17840 [3:37:20<30:59:29, 7.11s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2145/17840 [3:37:20<30:59:29, 7.11s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2145/17840 [3:37:20<30:59:29, 7.11s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:42,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:42,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0177, 'learning_rate': 9.32125890736342e-05, 'epoch': 2.41} +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:42,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:42,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:42,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2147/17840 [3:37:34<30:51:01, 7.08s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2147/17840 [3:37:34<30:51:01, 7.08s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:18:55,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:37:41<30:42:45, 7.05s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:37:41<30:42:45, 7.05s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7081, 'learning_rate': 9.320071258907363e-05, 'epoch': 2.41} + 12%|████████▊ | 2148/17840 [3:37:41<30:42:45, 7.05s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:37:41<30:42:45, 7.05s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:37:41<30:42:45, 7.05s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2149/17840 [3:37:48<30:30:44, 7.00s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:07,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:07,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2150/17840 [3:37:57<33:25:40, 7.67s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2150/17840 [3:37:57<33:25:40, 7.67s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8025, 'learning_rate': 9.318883610451306e-05, 'epoch': 2.41} + 12%|████████▊ | 2150/17840 [3:37:57<33:25:40, 7.67s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:19,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:19,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8199, 'learning_rate': 9.318289786223278e-05, 'epoch': 2.41} +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:19,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:19,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:19,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2152/17840 [3:38:11<31:32:25, 7.24s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2152/17840 [3:38:11<31:32:25, 7.24s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:31,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2153/17840 [3:38:17<30:47:23, 7.07s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2153/17840 [3:38:17<30:47:23, 7.07s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7648, 'learning_rate': 9.317102137767222e-05, 'epoch': 2.41} + 12%|████████▊ | 2153/17840 [3:38:17<30:47:23, 7.07s/it]g-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6847, 'learning_rate': 9.316508313539193e-05, 'epoch': 2.41} +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:39,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:18:16,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2155/17840 [3:38:31<29:58:17, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2155/17840 [3:38:31<29:58:17, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2155/17840 [3:38:31<29:58:17, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2156/17840 [3:38:37<29:37:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2156/17840 [3:38:37<29:37:36, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:56,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:19:56,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2157/17840 [3:38:44<29:29:43, 6.77s/it]g-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2157/17840 [3:38:44<29:29:43, 6.77s/it]g-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7063, 'learning_rate': 9.314726840855108e-05, 'epoch': 2.42} +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:04,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2158/17840 [3:38:51<29:19:58, 6.73s/it]g-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2158/17840 [3:38:51<29:19:58, 6.73s/it]g-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6201, 'learning_rate': 9.31413301662708e-05, 'epoch': 2.42} + 12%|████████▊ | 2158/17840 [3:38:51<29:19:58, 6.73s/it]g-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:13,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:13,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1939, 'learning_rate': 9.31353919239905e-05, 'epoch': 2.42} +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:13,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:13,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:13,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:19:48,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:39:04<28:47:25, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:39:04<28:47:25, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:39:04<28:47:25, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2161/17840 [3:39:10<28:31:07, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2161/17840 [3:39:10<28:31:07, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:29,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:29,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2162/17840 [3:39:16<28:19:16, 6.50s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2162/17840 [3:39:16<28:19:16, 6.50s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2163/17840 [3:39:23<28:01:22, 6.44s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2163/17840 [3:39:23<28:01:22, 6.44s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:41,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:41,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2164/17840 [3:39:29<27:44:24, 6.37s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2164/17840 [3:39:29<27:44:24, 6.37s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7947, 'learning_rate': 9.310570071258908e-05, 'epoch': 2.43} +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:49,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2165/17840 [3:39:35<27:30:06, 6.32s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2165/17840 [3:39:35<27:30:06, 6.32s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8079, 'learning_rate': 9.30997624703088e-05, 'epoch': 2.43} +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:55,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:20:55,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2166/17840 [3:39:41<27:09:28, 6.24s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2166/17840 [3:39:41<27:09:28, 6.24s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:01,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:01,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2167/17840 [3:39:47<27:02:32, 6.21s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2167/17840 [3:39:47<27:02:32, 6.21s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:07,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:07,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2168/17840 [3:39:53<26:46:26, 6.15s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:12,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:12,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:12,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2169/17840 [3:39:59<26:24:24, 6.07s/it]g-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:18,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:18,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:18,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:20:21,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2170/17840 [3:40:05<25:55:30, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2170/17840 [3:40:05<25:55:30, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:26,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:26,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.645, 'learning_rate': 9.306413301662708e-05, 'epoch': 2.43} +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:30,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2172/17840 [3:40:16<25:17:33, 5.81s/it]g-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2172/17840 [3:40:16<25:17:33, 5.81s/it]g-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:34,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:34,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:34,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2173/17840 [3:40:22<24:45:05, 5.69s/it]g-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:40,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:40,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:40,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:22,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2174/17840 [3:40:27<24:13:22, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:46,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:46,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2175/17840 [3:40:34<26:12:17, 6.02s/it]g-point operations will not be computed-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:52,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:54,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:54,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6436, 'learning_rate': 9.303444180522565e-05, 'epoch': 2.44} +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:58,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:21:58,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:21:44,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2177/17840 [3:40:43<23:02:32, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:00,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:02,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:00,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:02,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:00,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2178/17840 [3:40:47<21:36:25, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:04,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2179/17840 [3:40:51<20:01:38, 4.60s/it]g-point operations will not be computed-17 20:22:04,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2179/17840 [3:40:51<20:01:38, 4.60s/it]g-point operations will not be computed-17 20:22:04,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2179/17840 [3:40:51<20:01:38, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:08,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2179/17840 [3:40:51<20:01:38, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:08,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2180/17840 [3:40:55<18:18:15, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:11,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:12,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:11,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:12,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:11,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:15,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:14,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:15,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:14,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2182/17840 [3:41:00<14:56:24, 3.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:16,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2182/17840 [3:41:00<14:56:24, 3.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:16,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2183/17840 [3:41:02<13:26:21, 3.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:18,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2183/17840 [3:41:02<13:26:21, 3.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:18,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:41:04<12:06:06, 2.78s/it]g-point operations will not be computed-17 20:22:18,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:41:04<12:06:06, 2.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:22,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:41:04<12:06:06, 2.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:22,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:26,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:22,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:26,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:22,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:41:12<18:43:08, 4.30s/it]g-point operations will not be computed-17 20:22:22,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:41:12<18:43:08, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:30,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:41:12<18:43:08, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:30,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:33,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:30,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:33,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:30,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:41:20<22:56:40, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:41:20<22:56:40, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:41:20<22:56:40, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2187/17840 [3:41:27<25:45:35, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2187/17840 [3:41:27<25:45:35, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9252, 'learning_rate': 9.296912114014252e-05, 'epoch': 2.45} + 12%|████████▉ | 2187/17840 [3:41:27<25:45:35, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2187/17840 [3:41:27<25:45:35, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2187/17840 [3:41:27<25:45:35, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:41:35<27:43:59, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:41:35<27:43:59, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:41:35<27:43:59, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:57,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:57,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6189, 'learning_rate': 9.295724465558195e-05, 'epoch': 2.45} +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:57,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:22:57,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:41:49<29:53:18, 6.88s/it]g-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:41:49<29:53:18, 6.88s/it]g-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6154, 'learning_rate': 9.295130641330166e-05, 'epoch': 2.46} + 12%|████████▉ | 2190/17840 [3:41:49<29:53:18, 6.88s/it]g-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:41:49<29:53:18, 6.88s/it]g-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:41:49<29:53:18, 6.88s/it]g-point operations will not be computed-17 20:22:37,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2191/17840 [3:41:57<30:20:00, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2191/17840 [3:41:57<30:20:00, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2191/17840 [3:41:57<30:20:00, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:42:04<30:47:01, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:42:04<30:47:01, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9051, 'learning_rate': 9.29394299287411e-05, 'epoch': 2.46} + 12%|████████▉ | 2192/17840 [3:42:04<30:47:01, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:42:04<30:47:01, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:42:04<30:47:01, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2193/17840 [3:42:11<30:54:51, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2193/17840 [3:42:11<30:54:51, 7.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:32,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:42:18<31:01:28, 7.14s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:42:18<31:01:28, 7.14s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0098, 'learning_rate': 9.292755344418053e-05, 'epoch': 2.46} + 12%|████████▉ | 2194/17840 [3:42:18<31:01:28, 7.14s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:42:18<31:01:28, 7.14s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:42:18<31:01:28, 7.14s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2195/17840 [3:42:25<30:57:51, 7.13s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:44,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:44,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2196/17840 [3:42:32<30:49:19, 7.09s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2196/17840 [3:42:32<30:49:19, 7.09s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7955, 'learning_rate': 9.291567695961995e-05, 'epoch': 2.46} + 12%|████████▉ | 2196/17840 [3:42:32<30:49:19, 7.09s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:55,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:55,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6786, 'learning_rate': 9.290973871733967e-05, 'epoch': 2.46} +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:55,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:23:55,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2198/17840 [3:42:46<30:30:21, 7.02s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2198/17840 [3:42:46<30:30:21, 7.02s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:05,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:05,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2199/17840 [3:42:53<30:18:07, 6.97s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2199/17840 [3:42:53<30:18:07, 6.97s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7539, 'learning_rate': 9.28978622327791e-05, 'epoch': 2.47} + 12%|████████▉ | 2199/17840 [3:42:53<30:18:07, 6.97s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2199/17840 [3:42:53<30:18:07, 6.97s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2200/17840 [3:43:02<33:16:32, 7.66s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2200/17840 [3:43:02<33:16:32, 7.66s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.86, 'learning_rate': 9.289192399049882e-05, 'epoch': 2.47} +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:23,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2201/17840 [3:43:09<32:20:36, 7.45s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2201/17840 [3:43:09<32:20:36, 7.45s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7525, 'learning_rate': 9.288598574821853e-05, 'epoch': 2.47} + 12%|█████████ | 2201/17840 [3:43:09<32:20:36, 7.45s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2201/17840 [3:43:09<32:20:36, 7.45s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2201/17840 [3:43:09<32:20:36, 7.45s/it]g-point operations will not be computed-17 20:23:14,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2202/17840 [3:43:16<31:36:41, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2202/17840 [3:43:16<31:36:41, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2202/17840 [3:43:16<31:36:41, 7.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2203/17840 [3:43:23<30:56:03, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2203/17840 [3:43:23<30:56:03, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:42,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:24:42,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2204/17840 [3:43:30<30:22:50, 6.99s/it]g-point operations will not be computed-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2204/17840 [3:43:30<30:22:50, 6.99s/it]g-point operations will not be computed-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.589, 'learning_rate': 9.286817102137768e-05, 'epoch': 2.47} + 12%|█████████ | 2204/17840 [3:43:30<30:22:50, 6.99s/it]g-point operations will not be computed-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2204/17840 [3:43:30<30:22:50, 6.99s/it]g-point operations will not be computed-17 20:24:33,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2205/17840 [3:43:36<30:08:38, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2205/17840 [3:43:36<30:08:38, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9615, 'learning_rate': 9.28622327790974e-05, 'epoch': 2.47} + 12%|█████████ | 2205/17840 [3:43:36<30:08:38, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2206/17840 [3:43:43<29:54:10, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2206/17840 [3:43:43<29:54:10, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7987, 'learning_rate': 9.28562945368171e-05, 'epoch': 2.47} +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:04,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:04,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2207/17840 [3:43:50<29:43:37, 6.85s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2207/17840 [3:43:50<29:43:37, 6.85s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2207/17840 [3:43:50<29:43:37, 6.85s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:12,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:12,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7793, 'learning_rate': 9.284441805225653e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:12,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:19,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:19,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6772, 'learning_rate': 9.283847980997625e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:19,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:19,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:19,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2210/17840 [3:44:10<28:46:15, 6.63s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:28,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:28,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:28,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2211/17840 [3:44:16<28:34:22, 6.58s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:35,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:35,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:35,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2212/17840 [3:44:22<28:17:55, 6.52s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:41,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:41,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:41,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2213/17840 [3:44:29<28:02:21, 6.46s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:47,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:47,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:47,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2214/17840 [3:44:35<27:45:31, 6.40s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2214/17840 [3:44:35<27:45:31, 6.40s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:55,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:25:55,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2215/17840 [3:44:41<27:29:53, 6.34s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2215/17840 [3:44:41<27:29:53, 6.34s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2216/17840 [3:44:47<27:18:51, 6.29s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2216/17840 [3:44:47<27:18:51, 6.29s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:07,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:07,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2217/17840 [3:44:53<26:56:08, 6.21s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:12,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:12,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:12,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2218/17840 [3:44:59<26:25:26, 6.09s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2218/17840 [3:44:59<26:25:26, 6.09s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:19,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:19,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2219/17840 [3:45:05<25:59:44, 5.99s/it]g-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:23,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:24:54,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2220/17840 [3:45:11<25:33:20, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2220/17840 [3:45:11<25:33:20, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:32,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:32,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5913, 'learning_rate': 9.276722090261283e-05, 'epoch': 2.49} +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:36,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:36,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2222/17840 [3:45:21<24:31:59, 5.65s/it]g-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:40,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:42,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:42,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8803, 'learning_rate': 9.275534441805225e-05, 'epoch': 2.49} +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:46,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:46,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:28,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2224/17840 [3:45:32<23:12:01, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:51,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2225/17840 [3:45:38<24:46:08, 5.71s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2225/17840 [3:45:38<24:46:08, 5.71s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:56,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:58,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:26:58,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:00,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:02,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:02,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:04,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:04,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:06,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:09,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:09,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:11,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:12,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:12,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:15,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:15,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:16,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:16,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:19,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:19,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:21,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:22,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:22,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6326, 'learning_rate': 9.269002375296912e-05, 'epoch': 2.5} +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:26,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:26,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:26,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:30,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:30,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:34,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:34,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:34,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:37,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:37,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:27:43,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:46:30<25:50:59, 5.96s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:46:30<25:50:59, 5.96s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0517, 'learning_rate': 9.267220902612827e-05, 'epoch': 2.51} + 13%|█████████▏ | 2237/17840 [3:46:30<25:50:59, 5.96s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:46:30<25:50:59, 5.96s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:46:30<25:50:59, 5.96s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:46:37<27:37:53, 6.38s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:46:37<27:37:53, 6.38s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:46:37<27:37:53, 6.38s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:00,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:00,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6716, 'learning_rate': 9.26603325415677e-05, 'epoch': 2.51} +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:00,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:00,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:46:52<29:45:56, 6.87s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:46:52<29:45:56, 6.87s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6942, 'learning_rate': 9.265439429928742e-05, 'epoch': 2.51} + 13%|█████████▏ | 2240/17840 [3:46:52<29:45:56, 6.87s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:46:52<29:45:56, 6.87s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:46:52<29:45:56, 6.87s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2241/17840 [3:46:59<30:21:48, 7.01s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:18,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:18,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2242/17840 [3:47:06<30:34:42, 7.06s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2242/17840 [3:47:06<30:34:42, 7.06s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6898, 'learning_rate': 9.264251781472685e-05, 'epoch': 2.51} + 13%|█████████▏ | 2242/17840 [3:47:06<30:34:42, 7.06s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2242/17840 [3:47:06<30:34:42, 7.06s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2242/17840 [3:47:06<30:34:42, 7.06s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2243/17840 [3:47:13<30:50:56, 7.12s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2243/17840 [3:47:13<30:50:56, 7.12s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:34,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2244/17840 [3:47:21<31:01:46, 7.16s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2244/17840 [3:47:21<31:01:46, 7.16s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.831, 'learning_rate': 9.263064133016627e-05, 'epoch': 2.52} + 13%|█████████▏ | 2244/17840 [3:47:21<31:01:46, 7.16s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2244/17840 [3:47:21<31:01:46, 7.16s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2244/17840 [3:47:21<31:01:46, 7.16s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2245/17840 [3:47:28<31:03:04, 7.17s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2245/17840 [3:47:28<31:03:04, 7.17s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:28:49,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:47:35<30:56:42, 7.14s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:47:35<30:56:42, 7.14s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7538, 'learning_rate': 9.261876484560571e-05, 'epoch': 2.52} + 13%|█████████▏ | 2246/17840 [3:47:35<30:56:42, 7.14s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:47:35<30:56:42, 7.14s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:47:35<30:56:42, 7.14s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2247/17840 [3:47:42<30:47:32, 7.11s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:01,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:01,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:47:49<30:38:04, 7.07s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:47:49<30:38:04, 7.07s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7396, 'learning_rate': 9.260688836104513e-05, 'epoch': 2.52} + 13%|█████████▏ | 2248/17840 [3:47:49<30:38:04, 7.07s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:47:49<30:38:04, 7.07s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:47:49<30:38:04, 7.07s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2249/17840 [3:47:56<30:34:13, 7.06s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:15,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:15,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2250/17840 [3:48:05<33:26:32, 7.72s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2250/17840 [3:48:05<33:26:32, 7.72s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5454, 'learning_rate': 9.259501187648455e-05, 'epoch': 2.52} + 13%|█████████▏ | 2250/17840 [3:48:05<33:26:32, 7.72s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2250/17840 [3:48:05<33:26:32, 7.72s/it]g-point operations will not be computed-17 20:26:48,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2251/17840 [3:48:12<32:24:22, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2251/17840 [3:48:12<32:24:22, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6862, 'learning_rate': 9.258907363420429e-05, 'epoch': 2.52} + 13%|█████████▏ | 2251/17840 [3:48:12<32:24:22, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2252/17840 [3:48:19<31:33:20, 7.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2252/17840 [3:48:19<31:33:20, 7.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6563, 'learning_rate': 9.2583135391924e-05, 'epoch': 2.52} + 13%|█████████▏ | 2252/17840 [3:48:19<31:33:20, 7.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:41,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:41,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8249, 'learning_rate': 9.257719714964372e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:41,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:41,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2254/17840 [3:48:33<30:28:23, 7.04s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2254/17840 [3:48:33<30:28:23, 7.04s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:51,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:29:51,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2255/17840 [3:48:39<30:02:47, 6.94s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2255/17840 [3:48:39<30:02:47, 6.94s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6829, 'learning_rate': 9.256532066508314e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:00,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:48:46<29:50:02, 6.89s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:48:46<29:50:02, 6.89s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0343, 'learning_rate': 9.255938242280285e-05, 'epoch': 2.53} + 13%|█████████▏ | 2256/17840 [3:48:46<29:50:02, 6.89s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:08,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:08,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7731, 'learning_rate': 9.255344418052257e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:08,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:08,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2258/17840 [3:48:59<29:16:02, 6.76s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2258/17840 [3:48:59<29:16:02, 6.76s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:18,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:18,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2259/17840 [3:49:06<28:54:40, 6.68s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2259/17840 [3:49:06<28:54:40, 6.68s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9682, 'learning_rate': 9.2541567695962e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:26,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:26,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2260/17840 [3:49:12<28:39:42, 6.62s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2260/17840 [3:49:12<28:39:42, 6.62s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2260/17840 [3:49:12<28:39:42, 6.62s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2260/17840 [3:49:12<28:39:42, 6.62s/it]g-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:34,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:34,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:34,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:40,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:40,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7534, 'learning_rate': 9.252375296912114e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:40,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:47,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:47,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6388, 'learning_rate': 9.251781472684085e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:47,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.75, 'learning_rate': 9.251187648456057e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:30:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:29:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2265/17840 [3:49:44<27:10:10, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2265/17840 [3:49:44<27:10:10, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:05,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:05,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5732, 'learning_rate': 9.250000000000001e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:05,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:11,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:11,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7539, 'learning_rate': 9.249406175771972e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:11,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:17,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:17,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8466, 'learning_rate': 9.248812351543944e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:21,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:21,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2269/17840 [3:50:07<25:59:22, 6.01s/it]g-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:26,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:26,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:26,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2270/17840 [3:50:13<25:41:59, 5.94s/it]g-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:32,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:32,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:32,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:01,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2271/17840 [3:50:19<25:21:11, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2271/17840 [3:50:19<25:21:11, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:40,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:40,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4145, 'learning_rate': 9.24643705463183e-05, 'epoch': 2.55} +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:44,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:44,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2273/17840 [3:50:30<24:17:51, 5.62s/it]g-point operations will not be computed-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:48,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:48,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:48,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:36,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2274/17840 [3:50:35<23:40:53, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:54,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:31:54,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2275/17840 [3:50:42<25:36:12, 5.92s/it]g-point operations will not be computed-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:00,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:02,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:02,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4747, 'learning_rate': 9.244061757719715e-05, 'epoch': 2.55} +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:05,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:05,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:31:52,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2277/17840 [3:50:51<22:14:01, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:07,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2278/17840 [3:50:55<20:37:26, 4.77s/it]g-point operations will not be computed-17 20:32:07,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2278/17840 [3:50:55<20:37:26, 4.77s/it]g-point operations will not be computed-17 20:32:07,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2278/17840 [3:50:55<20:37:26, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:11,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2278/17840 [3:50:55<20:37:26, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:11,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2279/17840 [3:50:58<19:01:12, 4.40s/it]g-point operations will not be computed-17 20:32:11,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:16,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:14,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:16,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:14,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2280/17840 [3:51:01<17:29:37, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:18,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2281/17840 [3:51:04<16:07:00, 3.73s/it]g-point operations will not be computed-17 20:32:18,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2281/17840 [3:51:04<16:07:00, 3.73s/it]g-point operations will not be computed-17 20:32:18,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2282/17840 [3:51:07<14:43:26, 3.41s/it]g-point operations will not be computed-17 20:32:21,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2282/17840 [3:51:07<14:43:26, 3.41s/it]g-point operations will not be computed-17 20:32:21,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:24,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:23,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:24,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:23,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2283/17840 [3:51:09<13:19:36, 3.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:25,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2283/17840 [3:51:09<13:19:36, 3.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:25,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2284/17840 [3:51:11<12:02:51, 2.79s/it]g-point operations will not be computed-17 20:32:25,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2284/17840 [3:51:11<12:02:51, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:29,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2284/17840 [3:51:11<12:02:51, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:29,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:33,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:29,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:33,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:29,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2285/17840 [3:51:19<18:41:42, 4.33s/it]g-point operations will not be computed-17 20:32:29,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2285/17840 [3:51:19<18:41:42, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:37,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:32:41,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:37,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:51:27<23:00:19, 5.32s/it]g-point operations will not be computed-17 20:32:37,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:51:27<23:00:19, 5.32s/it]g-point operations will not be computed-17 20:32:37,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:51:27<23:00:19, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:51:27<23:00:19, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2286/17840 [3:51:27<23:00:19, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:51:35<25:51:29, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:51:35<25:51:29, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9059, 'learning_rate': 9.237529691211402e-05, 'epoch': 2.56} + 13%|█████████▎ | 2287/17840 [3:51:35<25:51:29, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:51:35<25:51:29, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:51:35<25:51:29, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2288/17840 [3:51:42<27:37:52, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:01,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:01,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2289/17840 [3:51:49<28:54:21, 6.69s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2289/17840 [3:51:49<28:54:21, 6.69s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7038, 'learning_rate': 9.236342042755344e-05, 'epoch': 2.57} + 13%|█████████▎ | 2289/17840 [3:51:49<28:54:21, 6.69s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2289/17840 [3:51:49<28:54:21, 6.69s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2289/17840 [3:51:49<28:54:21, 6.69s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2290/17840 [3:51:57<29:42:18, 6.88s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2290/17840 [3:51:57<29:42:18, 6.88s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2290/17840 [3:51:57<29:42:18, 6.88s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:19,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:19,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7621, 'learning_rate': 9.235154394299289e-05, 'epoch': 2.57} +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:19,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:19,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2292/17840 [3:52:11<30:19:18, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2292/17840 [3:52:11<30:19:18, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7855, 'learning_rate': 9.234560570071259e-05, 'epoch': 2.57} + 13%|█████████▍ | 2292/17840 [3:52:11<30:19:18, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:34,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:34,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.924, 'learning_rate': 9.233966745843231e-05, 'epoch': 2.57} +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:34,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:34,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:34,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2294/17840 [3:52:25<30:33:02, 7.07s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2294/17840 [3:52:25<30:33:02, 7.07s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2294/17840 [3:52:25<30:33:02, 7.07s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:48,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:48,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8057, 'learning_rate': 9.232779097387174e-05, 'epoch': 2.57} +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:48,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:48,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:33:48,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2296/17840 [3:52:39<30:25:45, 7.05s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2296/17840 [3:52:39<30:25:45, 7.05s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:00,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:52:46<30:18:12, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:52:46<30:18:12, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1835, 'learning_rate': 9.231591448931117e-05, 'epoch': 2.58} + 13%|█████████▍ | 2297/17840 [3:52:46<30:18:12, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:09,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:09,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7264, 'learning_rate': 9.230997624703089e-05, 'epoch': 2.58} +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:09,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:09,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|███████��█▍ | 2299/17840 [3:53:00<30:18:17, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2299/17840 [3:53:00<30:18:17, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6432, 'learning_rate': 9.230403800475061e-05, 'epoch': 2.58} + 13%|█████████▍ | 2299/17840 [3:53:00<30:18:17, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2299/17840 [3:53:00<30:18:17, 7.02s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2300/17840 [3:53:09<33:06:37, 7.67s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2300/17840 [3:53:09<33:06:37, 7.67s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6338, 'learning_rate': 9.229809976247031e-05, 'epoch': 2.58} + 13%|█████████▍ | 2300/17840 [3:53:09<33:06:37, 7.67s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2300/17840 [3:53:09<33:06:37, 7.67s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2301/17840 [3:53:16<32:04:52, 7.43s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2301/17840 [3:53:16<32:04:52, 7.43s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8313, 'learning_rate': 9.229216152019002e-05, 'epoch': 2.58} +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2302/17840 [3:53:23<31:22:56, 7.27s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2302/17840 [3:53:23<31:22:56, 7.27s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6593, 'learning_rate': 9.228622327790974e-05, 'epoch': 2.58} + 13%|█████████▍ | 2302/17840 [3:53:23<31:22:56, 7.27s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:45,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:45,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:49,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:49,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2304/17840 [3:53:37<30:19:21, 7.03s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2304/17840 [3:53:37<30:19:21, 7.03s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9019, 'learning_rate': 9.227434679334917e-05, 'epoch': 2.58} +[WARNING|modeling_utils.py:388] 2022-03-17 20:34:57,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2305/17840 [3:53:43<29:55:51, 6.94s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2305/17840 [3:53:43<29:55:51, 6.94s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7173, 'learning_rate': 9.226840855106889e-05, 'epoch': 2.58} + 13%|█████████▍ | 2305/17840 [3:53:43<29:55:51, 6.94s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:06,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:06,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:06,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6688, 'learning_rate': 9.226247030878861e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:06,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2307/17840 [3:53:57<29:30:03, 6.84s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2307/17840 [3:53:57<29:30:03, 6.84s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7379, 'learning_rate': 9.225653206650832e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:17,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2308/17840 [3:54:04<29:14:33, 6.78s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2308/17840 [3:54:04<29:14:33, 6.78s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8043, 'learning_rate': 9.225059382422804e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:24,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:24,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2309/17840 [3:54:10<28:58:57, 6.72s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2309/17840 [3:54:10<28:58:57, 6.72s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2309/17840 [3:54:10<28:58:57, 6.72s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:32,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:32,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6502, 'learning_rate': 9.223871733966746e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:32,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:32,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:32,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2311/17840 [3:54:23<28:34:02, 6.62s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:42,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:42,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:42,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2312/17840 [3:54:30<28:20:24, 6.57s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2312/17840 [3:54:30<28:20:24, 6.57s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:50,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:50,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2313/17840 [3:54:36<28:07:53, 6.52s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2313/17840 [3:54:36<28:07:53, 6.52s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:56,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:35:56,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2314/17840 [3:54:42<27:53:41, 6.47s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2314/17840 [3:54:42<27:53:41, 6.47s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:03,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:03,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2315/17840 [3:54:49<27:38:05, 6.41s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2315/17840 [3:54:49<27:38:05, 6.41s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2315/17840 [3:54:49<27:38:05, 6.41s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:10,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:10,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5197, 'learning_rate': 9.220308788598575e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:15,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:15,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2317/17840 [3:55:01<27:07:09, 6.29s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2317/17840 [3:55:01<27:07:09, 6.29s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:21,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:21,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2318/17840 [3:55:07<26:55:39, 6.25s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2318/17840 [3:55:07<26:55:39, 6.25s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:27,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:27,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2319/17840 [3:55:13<26:35:24, 6.17s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2319/17840 [3:55:13<26:35:24, 6.17s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:33,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:33,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2320/17840 [3:55:19<26:14:54, 6.09s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2320/17840 [3:55:19<26:14:54, 6.09s/it]g-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:39,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:39,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:32:44,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2321/17840 [3:55:25<25:48:58, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:42,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2321/17840 [3:55:25<25:48:58, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:42,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2321/17840 [3:55:25<25:48:58, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:42,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████���███▍ | 2321/17840 [3:55:25<25:48:58, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:42,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2322/17840 [3:55:31<25:21:38, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2322/17840 [3:55:31<25:21:38, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:51,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:51,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6938, 'learning_rate': 9.216152019002375e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:55,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:55,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2324/17840 [3:55:41<24:02:48, 5.58s/it]g-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:59,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:36:59,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2325/17840 [3:55:48<26:08:20, 6.07s/it]g-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2325/17840 [3:55:48<26:08:20, 6.07s/it]g-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5427, 'learning_rate': 9.214964370546319e-05, 'epoch': 2.61} +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:07,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:07,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:36:47,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2326/17840 [3:55:53<24:24:41, 5.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:10,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:12,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:10,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:12,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:10,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2327/17840 [3:55:58<22:51:48, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:14,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:16,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:14,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:16,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:14,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2328/17840 [3:56:02<21:14:45, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:18,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:20,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:18,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:20,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:18,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2329/17840 [3:56:05<19:39:09, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:22,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2330/17840 [3:56:09<18:00:55, 4.18s/it]g-point operations will not be computed-17 20:37:22,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2330/17840 [3:56:09<18:00:55, 4.18s/it]g-point operations will not be computed-17 20:37:22,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:26,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:25,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:26,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:25,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2331/17840 [3:56:12<16:28:51, 3.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:28,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2331/17840 [3:56:12<16:28:51, 3.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:28,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2332/17840 [3:56:14<14:57:32, 3.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:30,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2333/17840 [3:56:17<13:28:56, 3.13s/it]g-point operations will not be computed-17 20:37:30,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2333/17840 [3:56:17<13:28:56, 3.13s/it]g-point operations will not be computed-17 20:37:30,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2334/17840 [3:56:19<12:07:21, 2.81s/it]g-point operations will not be computed-17 20:37:33,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2334/17840 [3:56:19<12:07:21, 2.81s/it]g-point operations will not be computed-17 20:37:33,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2334/17840 [3:56:19<12:07:21, 2.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:36,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2334/17840 [3:56:19<12:07:21, 2.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:36,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:40,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:36,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2335/17840 [3:56:27<18:47:32, 4.36s/it]g-point operations will not be computed-17 20:37:36,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2335/17840 [3:56:27<18:47:32, 4.36s/it]g-point operations will not be computed-17 20:37:36,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2335/17840 [3:56:27<18:47:32, 4.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2335/17840 [3:56:27<18:47:32, 4.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:48,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:37:48,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:56:34<23:07:19, 5.37s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:56:34<23:07:19, 5.37s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:56:34<23:07:19, 5.37s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:56:34<23:07:19, 5.37s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2336/17840 [3:56:34<23:07:19, 5.37s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:56:42<25:55:31, 6.02s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:56:42<25:55:31, 6.02s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:56:42<25:55:31, 6.02s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:56:42<25:55:31, 6.02s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:56:42<25:55:31, 6.02s/it]g-point operations will not be computed-17 20:37:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2338/17840 [3:56:49<27:45:54, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2338/17840 [3:56:49<27:45:54, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2338/17840 [3:56:49<27:45:54, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:56:57<28:58:09, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:56:57<28:58:09, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6303, 'learning_rate': 9.20665083135392e-05, 'epoch': 2.62} + 13%|█████████▌ | 2339/17840 [3:56:57<28:58:09, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:56:57<28:58:09, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:56:57<28:58:09, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2340/17840 [3:57:04<29:51:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2340/17840 [3:57:04<29:51:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2340/17840 [3:57:04<29:51:41, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:27,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:27,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7408, 'learning_rate': 9.205463182897862e-05, 'epoch': 2.62} +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:27,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:27,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:27,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2342/17840 [3:57:19<30:42:32, 7.13s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2342/17840 [3:57:19<30:42:32, 7.13s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2342/17840 [3:57:19<30:42:32, 7.13s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:42,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:42,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7329, 'learning_rate': 9.204275534441805e-05, 'epoch': 2.63} +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:42,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:38:42,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:57:33<30:58:53, 7.20s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:57:33<30:58:53, 7.20s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8398, 'learning_rate': 9.203681710213778e-05, 'epoch': 2.63} + 13%|█████████▌ | 2344/17840 [3:57:33<30:58:53, 7.20s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:57:33<30:58:53, 7.20s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:57:33<30:58:53, 7.20s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2345/17840 [3:57:40<30:53:24, 7.18s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:00,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:00,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2346/17840 [3:57:48<30:49:31, 7.16s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2346/17840 [3:57:48<30:49:31, 7.16s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.76, 'learning_rate': 9.202494061757721e-05, 'epoch': 2.63} + 13%|█████████▌ | 2346/17840 [3:57:48<30:49:31, 7.16s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2346/17840 [3:57:48<30:49:31, 7.16s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2346/17840 [3:57:48<30:49:31, 7.16s/it]g-point operations will not be computed-17 20:38:07,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2347/17840 [3:57:55<30:43:12, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2347/17840 [3:57:55<30:43:12, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2347/17840 [3:57:55<30:43:12, 7.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2348/17840 [3:58:02<30:40:21, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2348/17840 [3:58:02<30:40:21, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.632, 'learning_rate': 9.201306413301663e-05, 'epoch': 2.63} + 13%|█████████▌ | 2348/17840 [3:58:02<30:40:21, 7.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:24,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:24,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7498, 'learning_rate': 9.200712589073634e-05, 'epoch': 2.63} +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:24,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:24,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2350/17840 [3:58:18<33:24:36, 7.76s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2350/17840 [3:58:18<33:24:36, 7.76s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8905, 'learning_rate': 9.200118764845606e-05, 'epoch': 2.63} + 13%|█████████▌ | 2350/17840 [3:58:18<33:24:36, 7.76s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:40,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:40,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7283, 'learning_rate': 9.199524940617578e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:40,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:40,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2352/17840 [3:58:32<31:30:11, 7.32s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2352/17840 [3:58:32<31:30:11, 7.32s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:51,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:51,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2353/17840 [3:58:39<30:47:00, 7.16s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2353/17840 [3:58:39<30:47:00, 7.16s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8339, 'learning_rate': 9.198337292161521e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:59,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:39:59,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2354/17840 [3:58:45<30:13:51, 7.03s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2354/17840 [3:58:45<30:13:51, 7.03s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2354/17840 [3:58:45<30:13:51, 7.03s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2354/17840 [3:58:45<30:13:51, 7.03s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2354/17840 [3:58:45<30:13:51, 7.03s/it]g-point operations will not be computed-17 20:39:12,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:58:52<29:47:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:58:52<29:47:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:58:52<29:47:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:58:52<29:47:13, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2356/17840 [3:58:59<29:23:01, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:18,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:18,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:18,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2357/17840 [3:59:05<29:09:28, 6.78s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2357/17840 [3:59:05<29:09:28, 6.78s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2357/17840 [3:59:05<29:09:28, 6.78s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2357/17840 [3:59:05<29:09:28, 6.78s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:27,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:27,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:27,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:34,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:34,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9171, 'learning_rate': 9.19477434679335e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:34,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:34,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:34,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2360/17840 [3:59:25<28:25:03, 6.61s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:44,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:44,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:44,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2361/17840 [3:59:31<28:13:45, 6.57s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2361/17840 [3:59:31<28:13:45, 6.57s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:52,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:52,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2362/17840 [3:59:38<27:59:08, 6.51s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2362/17840 [3:59:38<27:59:08, 6.51s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:58,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:40:58,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2363/17840 [3:59:44<27:40:20, 6.44s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2363/17840 [3:59:44<27:40:20, 6.44s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:04,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:04,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2364/17840 [3:59:50<27:27:30, 6.39s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2364/17840 [3:59:50<27:27:30, 6.39s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2364/17840 [3:59:50<27:27:30, 6.39s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2364/17840 [3:59:50<27:27:30, 6.39s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:12,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:12,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:12,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:12,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:18,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:18,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:18,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:18,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:24,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:24,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:24,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:24,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:30,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:30,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:35,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:35,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2369/17840 [4:00:21<26:04:15, 6.07s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2369/17840 [4:00:21<26:04:15, 6.07s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:41,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:41,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2370/17840 [4:00:26<25:39:26, 5.97s/it]g-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:45,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:45,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:45,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:40:09,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2371/17840 [4:00:32<25:17:46, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2371/17840 [4:00:32<25:17:46, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:53,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:53,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6398, 'learning_rate': 9.187054631828979e-05, 'epoch': 2.66} +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:57,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:41:57,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2373/17840 [4:00:43<24:16:28, 5.65s/it]g-point operations will not be computed-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:01,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:01,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:01,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:41:49,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2374/17840 [4:00:48<23:34:23, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:07,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:07,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2375/17840 [4:00:55<25:24:58, 5.92s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:13,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:15,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:15,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:17,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:19,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:19,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:21,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:23,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:23,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:25,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:25,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:27,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:29,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:29,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:30,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:33,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:33,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:35,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:35,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:37,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:37,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:38,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:38,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:41,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:41,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:45,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:45,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:45,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:48,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:48,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:52,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:52,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:42:52,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2386/17840 [4:01:40<22:40:16, 5.28s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2386/17840 [4:01:40<22:40:16, 5.28s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:02,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.763, 'learning_rate': 9.178147268408551e-05, 'epoch': 2.68} + g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [4:01:55<27:29:05, 6.40s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [4:01:55<27:29:05, 6.40s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [4:01:55<27:29:05, 6.40s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:18,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:18,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7369, 'learning_rate': 9.176959619952494e-05, 'epoch': 2.68} +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:18,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:18,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:18,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [4:02:10<29:26:15, 6.86s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [4:02:10<29:26:15, 6.86s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [4:02:10<29:26:15, 6.86s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [4:02:10<29:26:15, 6.86s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [4:02:10<29:26:15, 6.86s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2391/17840 [4:02:17<30:02:59, 7.00s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2391/17840 [4:02:17<30:02:59, 7.00s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:38,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2392/17840 [4:02:25<30:20:10, 7.07s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2392/17840 [4:02:25<30:20:10, 7.07s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8142, 'learning_rate': 9.17517814726841e-05, 'epoch': 2.68} + 13%|█████████▊ | 2392/17840 [4:02:25<30:20:10, 7.07s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2392/17840 [4:02:25<30:20:10, 7.07s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2392/17840 [4:02:25<30:20:10, 7.07s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2393/17840 [4:02:32<30:31:04, 7.11s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2393/17840 [4:02:32<30:31:04, 7.11s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:43:53,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [4:02:39<30:35:25, 7.13s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [4:02:39<30:35:25, 7.13s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4934, 'learning_rate': 9.173990498812351e-05, 'epoch': 2.68} + 13%|█████████▊ | 2394/17840 [4:02:39<30:35:25, 7.13s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [4:02:39<30:35:25, 7.13s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [4:02:39<30:35:25, 7.13s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2395/17840 [4:02:46<30:32:41, 7.12s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:05,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:05,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2396/17840 [4:02:53<30:28:34, 7.10s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2396/17840 [4:02:53<30:28:34, 7.10s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6808, 'learning_rate': 9.172802850356294e-05, 'epoch': 2.69} + 13%|█████████▊ | 2396/17840 [4:02:53<30:28:34, 7.10s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2396/17840 [4:02:53<30:28:34, 7.10s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2396/17840 [4:02:53<30:28:34, 7.10s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2397/17840 [4:03:00<30:26:25, 7.10s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:19,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:19,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:19,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2398/17840 [4:03:07<30:15:26, 7.05s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2398/17840 [4:03:07<30:15:26, 7.05s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2398/17840 [4:03:07<30:15:26, 7.05s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:30,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:30,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7396, 'learning_rate': 9.17102137767221e-05, 'epoch': 2.69} +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:30,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:30,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:30,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2400/17840 [4:03:24<33:05:54, 7.72s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2400/17840 [4:03:24<33:05:54, 7.72s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2400/17840 [4:03:24<33:05:54, 7.72s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:46,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:46,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7618, 'learning_rate': 9.169833729216153e-05, 'epoch': 2.69} +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:46,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:46,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:46,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2402/17840 [4:03:37<31:17:12, 7.30s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:56,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:44:56,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [4:03:44<30:42:11, 7.16s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [4:03:44<30:42:11, 7.16s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8395, 'learning_rate': 9.168646080760096e-05, 'epoch': 2.69} + 13%|█████████▊ | 2403/17840 [4:03:44<30:42:11, 7.16s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [4:03:44<30:42:11, 7.16s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [4:03:44<30:42:11, 7.16s/it]g-point operations will not be computed-17 20:42:05,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2404/17840 [4:03:51<30:21:57, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2404/17840 [4:03:51<30:21:57, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2404/17840 [4:03:51<30:21:57, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2404/17840 [4:03:51<30:21:57, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2405/17840 [4:03:58<30:00:04, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2405/17840 [4:03:58<30:00:04, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:18,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2406/17840 [4:04:04<29:35:20, 6.90s/it]g-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2406/17840 [4:04:04<29:35:20, 6.90s/it]g-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.818, 'learning_rate': 9.16686460807601e-05, 'epoch': 2.7} + 13%|█████████▊ | 2406/17840 [4:04:04<29:35:20, 6.90s/it]g-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:27,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:27,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8661, 'learning_rate': 9.166270783847981e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:27,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:27,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:27,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:08,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2408/17840 [4:04:18<29:05:32, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2408/17840 [4:04:18<29:05:32, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2408/17840 [4:04:18<29:05:32, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2408/17840 [4:04:18<29:05:32, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2409/17840 [4:04:24<28:46:52, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:43,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:43,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2410/17840 [4:04:31<28:34:14, 6.67s/it]g-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2410/17840 [4:04:31<28:34:14, 6.67s/it]g-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5392, 'learning_rate': 9.164489311163896e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:51,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2411/17840 [4:04:37<28:14:40, 6.59s/it]g-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2411/17840 [4:04:37<28:14:40, 6.59s/it]g-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0121, 'learning_rate': 9.163895486935868e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-17 20:45:58,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2412/17840 [4:04:44<28:01:17, 6.54s/it]g-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2412/17840 [4:04:44<28:01:17, 6.54s/it]g-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5904, 'learning_rate': 9.16330166270784e-05, 'epoch': 2.7} + 14%|█████████▊ | 2412/17840 [4:04:44<28:01:17, 6.54s/it]g-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:06,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:06,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5731, 'learning_rate': 9.16270783847981e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:06,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:06,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:06,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:45:35,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2414/17840 [4:04:57<27:45:08, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2414/17840 [4:04:57<27:45:08, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2414/17840 [4:04:57<27:45:08, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2414/17840 [4:04:57<27:45:08, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2415/17840 [4:05:03<27:34:17, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:22,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:22,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2416/17840 [4:05:09<27:18:18, 6.37s/it]g-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2416/17840 [4:05:09<27:18:18, 6.37s/it]g-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:28,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:28,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2417/17840 [4:05:15<27:10:23, 6.34s/it]g-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2417/17840 [4:05:15<27:10:23, 6.34s/it]g-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:34,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:34,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2418/17840 [4:05:22<26:50:48, 6.27s/it]g-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2418/17840 [4:05:22<26:50:48, 6.27s/it]g-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:40,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:40,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:40,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2419/17840 [4:05:27<26:25:24, 6.17s/it]g-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:46,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:46,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:46,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:14,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2420/17840 [4:05:33<25:54:13, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:50,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2420/17840 [4:05:33<25:54:13, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:46:50,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:54,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:50,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:54,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:50,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7213, 'learning_rate': 9.157957244655583e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-17 20:46:54,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:50,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:00,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:50,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:00,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:50,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5352, 'learning_rate': 9.157363420427553e-05, 'epoch': 2.72} +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:04,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:46:50,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2423/17840 [4:05:50<24:26:24, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2423/17840 [4:05:50<24:26:24, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7513, 'learning_rate': 9.156769596199525e-05, 'epoch': 2.72} +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:11,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:11,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5952, 'learning_rate': 9.156175771971497e-05, 'epoch': 2.72} +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:14,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2425/17840 [4:06:02<25:53:09, 6.05s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2425/17840 [4:06:02<25:53:09, 6.05s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:20,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:23,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:23,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:25,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:27,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:27,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:29,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:31,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:31,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:33,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:35,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:35,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:37,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:38,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:38,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:41,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:41,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:43,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:46,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:46,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:47,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:47,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:49,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:49,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.2465, 'learning_rate': 9.150237529691211e-05, 'epoch': 2.73} +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:53,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:53,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:57,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:47:57,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8404, 'learning_rate': 9.149643705463183e-05, 'epoch': 2.73} +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:01,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:01,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:06:49<23:01:55, 5.38s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:06:49<23:01:55, 5.38s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5964, 'learning_rate': 9.149049881235154e-05, 'epoch': 2.73} + 14%|█████████▉ | 2436/17840 [4:06:49<23:01:55, 5.38s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:06:49<23:01:55, 5.38s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [4:06:49<23:01:55, 5.38s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2437/17840 [4:06:56<25:45:47, 6.02s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:16,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:16,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:16,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:04<27:35:17, 6.45s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:04<27:35:17, 6.45s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:04<27:35:17, 6.45s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:04<27:35:17, 6.45s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [4:07:04<27:35:17, 6.45s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [4:07:11<28:44:07, 6.72s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [4:07:11<28:44:07, 6.72s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:32,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2440/17840 [4:07:18<29:26:40, 6.88s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2440/17840 [4:07:18<29:26:40, 6.88s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9629, 'learning_rate': 9.14667458432304e-05, 'epoch': 2.74} + 14%|█████████▉ | 2440/17840 [4:07:18<29:26:40, 6.88s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2440/17840 [4:07:18<29:26:40, 6.88s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2440/17840 [4:07:18<29:26:40, 6.88s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [4:07:26<29:53:09, 6.99s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [4:07:26<29:53:09, 6.99s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [4:07:26<29:53:09, 6.99s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:48,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:48,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6315, 'learning_rate': 9.145486935866983e-05, 'epoch': 2.74} +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:48,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:48,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:48:48,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [4:07:40<30:23:00, 7.10s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [4:07:40<30:23:00, 7.10s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [4:07:40<30:23:00, 7.10s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:03,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:03,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8296, 'learning_rate': 9.144299287410927e-05, 'epoch': 2.74} +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:03,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:03,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:03,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2445/17840 [4:07:54<30:26:38, 7.12s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2445/17840 [4:07:54<30:26:38, 7.12s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2445/17840 [4:07:54<30:26:38, 7.12s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:17,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:17,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8196, 'learning_rate': 9.14311163895487e-05, 'epoch': 2.74} +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:17,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:17,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:17,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2447/17840 [4:08:09<30:14:26, 7.07s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:27,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:27,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2448/17840 [4:08:15<29:59:26, 7.01s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2448/17840 [4:08:15<29:59:26, 7.01s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0644, 'learning_rate': 9.141923990498813e-05, 'epoch': 2.74} + 14%|██████████ | 2448/17840 [4:08:15<29:59:26, 7.01s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:38,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:38,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7384, 'learning_rate': 9.141330166270783e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:38,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:49:38,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [4:08:32<32:43:18, 7.65s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [4:08:32<32:43:18, 7.65s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7411, 'learning_rate': 9.140736342042756e-05, 'epoch': 2.75} + 14%|██████████ | 2450/17840 [4:08:32<32:43:18, 7.65s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [4:08:32<32:43:18, 7.65s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [4:08:32<32:43:18, 7.65s/it]g-point operations will not be computed-17 20:47:07,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [4:08:38<31:42:06, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [4:08:38<31:42:06, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [4:08:38<31:42:06, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [4:08:38<31:42:06, 7.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2452/17840 [4:08:45<30:56:44, 7.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2452/17840 [4:08:45<30:56:44, 7.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2453/17840 [4:08:52<30:28:40, 7.13s/it]g-point operations will not be computed-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2453/17840 [4:08:52<30:28:40, 7.13s/it]g-point operations will not be computed-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7164, 'learning_rate': 9.13895486935867e-05, 'epoch': 2.75} + 14%|██████████ | 2453/17840 [4:08:52<30:28:40, 7.13s/it]g-point operations will not be computed-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2453/17840 [4:08:52<30:28:40, 7.13s/it]g-point operations will not be computed-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2453/17840 [4:08:52<30:28:40, 7.13s/it]g-point operations will not be computed-17 20:49:56,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2454/17840 [4:08:59<30:08:14, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2454/17840 [4:08:59<30:08:14, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2454/17840 [4:08:59<30:08:14, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2454/17840 [4:08:59<30:08:14, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2455/17840 [4:09:06<29:50:45, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:25,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:25,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2456/17840 [4:09:12<29:25:18, 6.88s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2456/17840 [4:09:12<29:25:18, 6.88s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7334, 'learning_rate': 9.137173396674584e-05, 'epoch': 2.75} + 14%|██████████ | 2456/17840 [4:09:12<29:25:18, 6.88s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7859, 'learning_rate': 9.136579572446557e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:34,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2458/17840 [4:09:26<28:50:02, 6.75s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:44,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:44,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2459/17840 [4:09:32<28:35:46, 6.69s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2459/17840 [4:09:32<28:35:46, 6.69s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:51,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:51,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2460/17840 [4:09:39<28:17:53, 6.62s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2460/17840 [4:09:39<28:17:53, 6.62s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5649, 'learning_rate': 9.13479809976247e-05, 'epoch': 2.76} +[WARNING|modeling_utils.py:388] 2022-03-17 20:50:59,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2461/17840 [4:09:45<28:03:19, 6.57s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2461/17840 [4:09:45<28:03:19, 6.57s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8711, 'learning_rate': 9.134204275534442e-05, 'epoch': 2.76} +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:05,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [4:09:51<27:49:20, 6.51s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [4:09:51<27:49:20, 6.51s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6743, 'learning_rate': 9.133610451306413e-05, 'epoch': 2.76} + 14%|██████████ | 2462/17840 [4:09:51<27:49:20, 6.51s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [4:09:51<27:49:20, 6.51s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [4:09:51<27:49:20, 6.51s/it]g-point operations will not be computed-17 20:50:16,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2463/17840 [4:09:58<27:40:21, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:15,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2463/17840 [4:09:58<27:40:21, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:15,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2463/17840 [4:09:58<27:40:21, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:15,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2463/17840 [4:09:58<27:40:21, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:15,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2464/17840 [4:10:04<27:28:30, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:21,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2464/17840 [4:10:04<27:28:30, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:21,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2464/17840 [4:10:04<27:28:30, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:21,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2464/17840 [4:10:04<27:28:30, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:21,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2465/17840 [4:10:10<27:11:31, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:28,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2465/17840 [4:10:10<27:11:31, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:28,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2465/17840 [4:10:10<27:11:31, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:28,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2465/17840 [4:10:10<27:11:31, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:28,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [4:10:17<26:57:12, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:34,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [4:10:17<26:57:12, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:34,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [4:10:17<26:57:12, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:34,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [4:10:17<26:57:12, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:34,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2467/17840 [4:10:23<26:36:51, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:40,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2467/17840 [4:10:23<26:36:51, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:40,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:44,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:40,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:44,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:40,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7829, 'learning_rate': 9.130047505938243e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:44,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:40,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:44,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:40,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:44,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:40,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2469/17840 [4:10:35<26:00:56, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2469/17840 [4:10:35<26:00:56, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:56,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:51:56,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5577, 'learning_rate': 9.128859857482185e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:00,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2471/17840 [4:10:46<25:04:38, 5.87s/it]g-point operations will not be computed-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2471/17840 [4:10:46<25:04:38, 5.87s/it]g-point operations will not be computed-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:04,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:04,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:51:52,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2472/17840 [4:10:51<24:36:52, 5.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2472/17840 [4:10:51<24:36:52, 5.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6604, 'learning_rate': 9.12767220902613e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:12,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:12,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8449, 'learning_rate': 9.1270783847981e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:16,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2474/17840 [4:11:02<23:32:09, 5.51s/it]g-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2474/17840 [4:11:02<23:32:09, 5.51s/it]g-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:20,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:20,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2475/17840 [4:11:09<25:30:58, 5.98s/it]g-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2475/17840 [4:11:09<25:30:58, 5.98s/it]g-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6364, 'learning_rate': 9.125890736342043e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:28,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:08,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2476/17840 [4:11:14<23:52:20, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:30,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2476/17840 [4:11:14<23:52:20, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:30,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:33,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:30,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2477/17840 [4:11:18<22:19:55, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:35,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2477/17840 [4:11:18<22:19:55, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:35,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:37,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:35,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2478/17840 [4:11:22<20:47:07, 4.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:39,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2478/17840 [4:11:22<20:47:07, 4.87s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:39,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:40,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:39,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2479/17840 [4:11:26<19:19:13, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:42,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2479/17840 [4:11:26<19:19:13, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:42,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2480/17840 [4:11:29<17:49:44, 4.18s/it]g-point operations will not be computed-17 20:52:42,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2480/17840 [4:11:29<17:49:44, 4.18s/it]g-point operations will not be computed-17 20:52:42,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2480/17840 [4:11:29<17:49:44, 4.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:46,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2481/17840 [4:11:32<16:16:28, 3.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:48,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2481/17840 [4:11:32<16:16:28, 3.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:48,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2482/17840 [4:11:35<14:44:36, 3.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:51,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2482/17840 [4:11:35<14:44:36, 3.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:51,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2483/17840 [4:11:37<13:17:05, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:53,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2483/17840 [4:11:37<13:17:05, 3.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:53,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:54,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:53,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:52:54,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:53,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:11:39<12:00:12, 2.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:57,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:11:39<12:00:12, 2.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:52:57,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:01,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:52:57,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:11:47<18:22:27, 4.31s/it]g-point operations will not be computed-17 20:52:57,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:11:47<18:22:27, 4.31s/it]g-point operations will not be computed-17 20:52:57,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:11:47<18:22:27, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:11:47<18:22:27, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:08,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:11:55<22:37:43, 5.31s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:11:55<22:37:43, 5.31s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2004, 'learning_rate': 9.11935866983373e-05, 'epoch': 2.79} + 14%|██████████▏ | 2486/17840 [4:11:55<22:37:43, 5.31s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:11:55<22:37:43, 5.31s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2487/17840 [4:12:02<25:31:31, 5.99s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2487/17840 [4:12:02<25:31:31, 5.99s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7947, 'learning_rate': 9.1187648456057e-05, 'epoch': 2.79} + 14%|██████████▏ | 2487/17840 [4:12:02<25:31:31, 5.99s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2487/17840 [4:12:02<25:31:31, 5.99s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:25,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:25,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:25,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:25,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:25,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:17<28:38:10, 6.72s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:17<28:38:10, 6.72s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:17<28:38:10, 6.72s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:17<28:38:10, 6.72s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:12:17<28:38:10, 6.72s/it]g-point operations will not be computed-17 20:53:05,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:12:24<29:22:36, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:12:24<29:22:36, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:12:24<29:22:36, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:12:24<29:22:36, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:12:32<29:55:42, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:12:32<29:55:42, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:12:32<29:55:42, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:12:32<29:55:42, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:12:32<29:55:42, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2492/17840 [4:12:39<30:16:35, 7.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:58,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:53:58,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2493/17840 [4:12:46<30:28:39, 7.15s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2493/17840 [4:12:46<30:28:39, 7.15s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.631, 'learning_rate': 9.11520190023753e-05, 'epoch': 2.79} + 14%|██████████▏ | 2493/17840 [4:12:46<30:28:39, 7.15s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2493/17840 [4:12:46<30:28:39, 7.15s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2493/17840 [4:12:46<30:28:39, 7.15s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2494/17840 [4:12:54<30:35:47, 7.18s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2494/17840 [4:12:54<30:35:47, 7.18s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:14,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2495/17840 [4:13:01<30:31:40, 7.16s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2495/17840 [4:13:01<30:31:40, 7.16s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5625, 'learning_rate': 9.114014251781473e-05, 'epoch': 2.8} + 14%|██████████▏ | 2495/17840 [4:13:01<30:31:40, 7.16s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2495/17840 [4:13:01<30:31:40, 7.16s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2495/17840 [4:13:01<30:31:40, 7.16s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2496/17840 [4:13:08<30:20:11, 7.12s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:27,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:27,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2497/17840 [4:13:15<30:16:49, 7.10s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2497/17840 [4:13:15<30:16:49, 7.10s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9454, 'learning_rate': 9.112826603325417e-05, 'epoch': 2.8} + 14%|██████████▏ | 2497/17840 [4:13:15<30:16:49, 7.10s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:37,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:37,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5342, 'learning_rate': 9.112232779097387e-05, 'epoch': 2.8} +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:37,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:37,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:37,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2499/17840 [4:13:29<29:53:08, 7.01s/it]g-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:48,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 20:54:48,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 20:53:42,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2366] 2022-03-17 20:54:54,134 >> Num examples = 2642 | 2500/17840 [4:13:38<32:56:03, 7.73s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|trainer.py:2366] 2022-03-17 20:54:54,134 >> Num examples = 2642 | 2500/17840 [4:13:38<32:56:03, 7.73s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +{'loss': 3.4205, 'learning_rate': 9.11104513064133e-05, 'epoch': 2.8} +[INFO|trainer.py:2366] 2022-03-17 20:54:54,134 >> Num examples = 2642 | 2500/17840 [4:13:38<32:56:03, 7.73s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|▊ | 3/331 [00:04<09:20, 1.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|█ | 4/331 [00:07<10:47, 1.98s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▎ | 5/331 [00:10<13:26, 2.47s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▌ | 6/331 [00:14<15:18, 2.83s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▊ | 7/331 [00:16<15:00, 2.78s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|██ | 8/331 [00:20<15:42, 2.92s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▎ | 9/331 [00:23<16:57, 3.16s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▍ | 10/331 [00:28<19:00, 3.55s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▋ | 11/331 [00:31<17:56, 3.37s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|██▉ | 12/331 [00:34<17:20, 3.26s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▏ | 13/331 [00:37<16:50, 3.18s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▍ | 14/331 [00:40<16:32, 3.13s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▋ | 15/331 [00:45<19:28, 3.70s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▉ | 16/331 [00:50<21:41, 4.13s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▏ | 17/331 [00:54<22:07, 4.23s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▍ | 18/331 [00:57<19:01, 3.65s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▋ | 19/331 [01:00<18:32, 3.56s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▉ | 20/331 [01:02<16:26, 3.17s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|█████▏ | 21/331 [01:06<17:46, 3.44s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▍ | 22/331 [01:11<20:18, 3.94s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▋ | 23/331 [01:17<23:10, 4.52s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▉ | 24/331 [01:23<25:23, 4.96s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▏ | 25/331 [01:27<23:56, 4.69s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▍ | 26/331 [01:30<21:14, 4.18s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▋ | 27/331 [01:35<21:30, 4.24s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▉ | 28/331 [01:38<20:26, 4.05s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▏ | 29/331 [01:42<19:26, 3.86s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▍ | 30/331 [01:45<17:57, 3.58s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▋ | 31/331 [01:47<16:39, 3.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|███████▉ | 32/331 [01:50<16:07, 3.23s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▏ | 33/331 [01:54<16:13, 3.27s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▍ | 34/331 [01:57<16:11, 3.27s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▋ | 35/331 [02:01<16:43, 3.39s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▉ | 36/331 [02:05<18:20, 3.73s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▏ | 37/331 [02:10<20:02, 4.09s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▍ | 38/331 [02:15<20:35, 4.22s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▋ | 39/331 [02:19<20:47, 4.27s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▉ | 40/331 [02:22<17:58, 3.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|██████████▏ | 41/331 [02:24<16:24, 3.39s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▍ | 42/331 [02:29<18:32, 3.85s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▋ | 43/331 [02:34<20:06, 4.19s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▉ | 44/331 [02:39<21:15, 4.44s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▏ | 45/331 [02:42<19:19, 4.06s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▍ | 46/331 [02:45<16:56, 3.57s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▋ | 47/331 [02:47<15:04, 3.18s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|███████████▉ | 48/331 [02:51<15:48, 3.35s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▏ | 49/331 [02:55<17:22, 3.70s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▍ | 50/331 [02:59<17:18, 3.70s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▋ | 51/331 [03:03<17:56, 3.84s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|████████████▉ | 52/331 [03:06<16:40, 3.59s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▏ | 53/331 [03:10<16:45, 3.62s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▍ | 54/331 [03:12<15:15, 3.30s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▋ | 55/331 [03:18<17:46, 3.86s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▊ | 56/331 [03:21<17:21, 3.79s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|██████████████ | 57/331 [03:24<16:28, 3.61s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▎ | 58/331 [03:29<17:37, 3.87s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▌ | 59/331 [03:31<15:48, 3.49s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▊ | 60/331 [03:34<15:07, 3.35s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|███████████████ | 61/331 [03:39<16:12, 3.60s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▎ | 62/331 [03:42<15:37, 3.49s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▌ | 63/331 [03:47<18:06, 4.05s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▊ | 64/331 [03:50<16:53, 3.80s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████ | 65/331 [03:54<16:16, 3.67s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▎ | 66/331 [04:00<19:08, 4.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▌ | 67/331 [04:05<20:29, 4.66s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|████████████████▊ | 68/331 [04:10<20:35, 4.70s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████ | 69/331 [04:14<19:50, 4.54s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▎ | 70/331 [04:18<19:30, 4.48s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▌ | 71/331 [04:23<19:58, 4.61s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|█████████████████▊ | 72/331 [04:28<19:55, 4.61s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████ | 73/331 [04:32<18:48, 4.37s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████▎ | 74/331 [04:36<18:26, 4.30s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▌ | 75/331 [04:41<19:14, 4.51s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▊ | 76/331 [04:44<17:39, 4.16s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|███████████████████ | 77/331 [04:48<16:59, 4.01s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▎ | 78/331 [04:51<15:43, 3.73s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▌ | 79/331 [04:54<14:46, 3.52s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▊ | 80/331 [04:57<14:27, 3.46s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|████████████████████ | 81/331 [05:02<15:29, 3.72s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▎ | 82/331 [05:05<15:00, 3.62s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▌ | 83/331 [05:09<15:51, 3.84s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▊ | 84/331 [05:15<17:55, 4.36s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████ | 85/331 [05:18<15:45, 3.84s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▎ | 86/331 [05:23<17:09, 4.20s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▌ | 87/331 [05:26<16:21, 4.02s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|█████████████████████▊ | 88/331 [05:30<15:34, 3.84s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████ | 89/331 [05:32<13:44, 3.41s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▎ | 90/331 [05:35<12:39, 3.15s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▌ | 91/331 [05:39<13:59, 3.50s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|██████████████████████▊ | 92/331 [05:41<12:25, 3.12s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████ | 93/331 [05:45<12:44, 3.21s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████▎ | 94/331 [05:48<13:20, 3.38s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▌ | 95/331 [05:52<13:32, 3.44s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▊ | 96/331 [05:56<13:47, 3.52s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|████████████████████████ | 97/331 [05:58<12:48, 3.29s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▎ | 98/331 [06:02<13:43, 3.53s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▌ | 99/331 [06:06<13:41, 3.54s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▍ | 100/331 [06:09<12:38, 3.29s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▋ | 101/331 [06:12<12:33, 3.28s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▉ | 102/331 [06:17<14:34, 3.82s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████��████████▏ | 103/331 [06:20<13:22, 3.52s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▍ | 104/331 [06:23<13:08, 3.47s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▋ | 105/331 [06:27<13:07, 3.49s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▉ | 106/331 [06:30<13:10, 3.51s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|██████████████████████████▏ | 107/331 [06:33<11:38, 3.12s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▍ | 108/331 [06:35<11:14, 3.02s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▋ | 109/331 [06:38<11:10, 3.02s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▉ | 110/331 [06:43<12:27, 3.38s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▏ | 111/331 [06:46<12:42, 3.47s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▍ | 112/331 [06:50<12:50, 3.52s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▋ | 113/331 [06:52<11:40, 3.21s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▉ | 114/331 [06:56<12:02, 3.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▏ | 115/331 [06:59<12:10, 3.38s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▍ | 116/331 [07:03<12:47, 3.57s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▋ | 117/331 [07:07<12:48, 3.59s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|████████████████████████████▉ | 118/331 [07:10<12:08, 3.42s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████ | 119/331 [07:14<12:01, 3.40s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████▎ | 120/331 [07:17<12:04, 3.43s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▌ | 121/331 [07:22<13:09, 3.76s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▊ | 122/331 [07:25<12:37, 3.62s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████ | 123/331 [07:30<14:10, 4.09s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████▎ | 124/331 [07:34<13:48, 4.00s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▌ | 125/331 [07:39<15:04, 4.39s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▊ | 126/331 [07:44<15:11, 4.44s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|███████████████████████████████ | 127/331 [07:49<16:02, 4.72s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▎ | 128/331 [07:54<16:10, 4.78s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▌ | 129/331 [07:58<15:37, 4.64s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▊ | 130/331 [08:03<15:59, 4.77s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████ | 131/331 [08:09<16:25, 4.93s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▎ | 132/331 [08:12<15:08, 4.57s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▌ | 133/331 [08:15<13:33, 4.11s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████���███████████████▊ | 134/331 [08:19<12:50, 3.91s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████ | 135/331 [08:23<13:11, 4.04s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▎ | 136/331 [08:28<13:59, 4.30s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▌ | 137/331 [08:33<14:41, 4.54s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|█████████████████████████████████▊ | 138/331 [08:38<15:08, 4.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████ | 139/331 [08:40<12:37, 3.94s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████▎ | 140/331 [08:46<14:10, 4.45s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▌ | 141/331 [08:49<13:00, 4.11s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▋ | 142/331 [08:53<12:31, 3.98s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▉ | 143/331 [08:58<13:25, 4.29s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▏ | 144/331 [09:02<12:40, 4.07s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▍ | 145/331 [09:05<12:22, 3.99s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▋ | 146/331 [09:11<13:27, 4.36s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▉ | 147/331 [09:14<12:42, 4.14s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▏ | 148/331 [09:17<11:30, 3.77s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▍ | 149/331 [09:20<10:21, 3.41s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▋ | 150/331 [09:24<11:10, 3.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|████████████████████████████████████▉ | 151/331 [09:28<10:52, 3.63s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▏ | 152/331 [09:30<09:55, 3.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▍ | 153/331 [09:33<09:37, 3.25s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▋ | 154/331 [09:38<10:36, 3.60s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▉ | 155/331 [09:43<11:38, 3.97s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▏ | 156/331 [09:47<12:23, 4.25s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▍ | 157/331 [09:53<13:09, 4.54s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▋ | 158/331 [09:58<13:25, 4.65s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▉ | 159/331 [10:02<13:19, 4.65s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|███████████████████████████████████████▏ | 160/331 [10:06<12:06, 4.25s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▍ | 161/331 [10:09<11:34, 4.09s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▋ | 162/331 [10:15<12:28, 4.43s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▉ | 163/331 [10:19<12:35, 4.50s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|███████████████████████████████��████████▏ | 164/331 [10:23<11:47, 4.23s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▍ | 165/331 [10:27<11:20, 4.10s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▌ | 166/331 [10:30<10:51, 3.95s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▊ | 167/331 [10:35<11:13, 4.11s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████ | 168/331 [10:38<10:15, 3.78s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▎ | 169/331 [10:42<10:35, 3.92s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▌ | 170/331 [10:45<09:41, 3.61s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|█████████████████████████████████████████▊ | 171/331 [10:48<09:34, 3.59s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████ | 172/331 [10:51<08:52, 3.35s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████▎ | 173/331 [10:55<09:20, 3.55s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|████���█████████████████████████████████████▌ | 174/331 [10:58<08:43, 3.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|██████████████████████████████████████████▊ | 175/331 [11:02<08:59, 3.46s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████ | 176/331 [11:05<08:31, 3.30s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████▎ | 177/331 [11:09<09:23, 3.66s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▌ | 178/331 [11:14<10:30, 4.12s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▊ | 179/331 [11:20<11:17, 4.46s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|████████████████████████████████████████████ | 180/331 [11:24<10:59, 4.37s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▎ | 181/331 [11:28<10:49, 4.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▌ | 182/331 [11:31<09:26, 3.80s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▊ | 183/331 [11:33<08:17, 3.36s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████ | 184/331 [11:35<07:25, 3.03s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▎ | 185/331 [11:37<06:34, 2.70s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▌ | 186/331 [11:41<07:02, 2.92s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▊ | 187/331 [11:45<08:20, 3.47s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████ | 188/331 [11:49<08:19, 3.49s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████▎ | 189/331 [11:51<07:35, 3.21s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████▍ | 190/331 [11:54<07:04, 3.01s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▋ | 191/331 [11:57<06:57, 2.98s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▉ | 192/331 [11:59<06:35, 2.85s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|███████████████████████████████████████████████▏ | 193/331 [12:04<07:39, 3.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▍ | 194/331 [12:06<06:56, 3.04s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▋ | 195/331 [12:09<06:38, 2.93s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▉ | 196/331 [12:12<06:55, 3.08s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▏ | 197/331 [12:16<07:36, 3.41s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▍ | 198/331 [12:19<06:56, 3.13s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▋ | 199/331 [12:22<07:09, 3.26s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▉ | 200/331 [12:25<06:30, 2.98s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▏ | 201/331 [12:28<06:19, 2.92s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▍ | 202/331 [12:31<06:43, 3.13s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|███���█████████████████████████████████████████████▋ | 203/331 [12:35<06:48, 3.19s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|█████████████████████████████████████████████████▉ | 204/331 [12:39<07:33, 3.57s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▏ | 205/331 [12:43<07:44, 3.69s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▍ | 206/331 [12:47<07:37, 3.66s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▋ | 207/331 [12:51<08:14, 3.99s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▉ | 208/331 [12:56<08:26, 4.12s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▏ | 209/331 [12:58<07:19, 3.60s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▍ | 210/331 [13:00<06:28, 3.21s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▋ | 211/331 [13:04<06:37, 3.31s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▉ | 212/331 [13:06<06:05, 3.07s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|████████████████████████████████████████████████████ | 213/331 [13:10<06:09, 3.13s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▎ | 214/331 [13:12<05:37, 2.89s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▌ | 215/331 [13:14<05:10, 2.67s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▊ | 216/331 [13:19<06:20, 3.31s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████ | 217/331 [13:22<06:16, 3.30s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▎ | 218/331 [13:27<06:51, 3.65s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▌ | 219/331 [13:30<06:42, 3.59s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▊ | 220/331 [13:33<06:12, 3.36s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████ | 221/331 [13:37<06:20, 3.46s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▎ | 222/331 [13:39<05:49, 3.20s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▌ | 223/331 [13:43<05:57, 3.31s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|██████████████████████████████████████████████████████▊ | 224/331 [13:46<06:02, 3.39s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████ | 225/331 [13:50<06:04, 3.44s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████▎ | 226/331 [13:55<06:39, 3.80s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▌ | 227/331 [13:58<06:25, 3.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▊ | 228/331 [14:01<06:07, 3.57s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████ | 229/331 [14:05<05:57, 3.51s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████▎ | 230/331 [14:08<05:39, 3.36s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|█████████████████████████████████████████████████���██████▌ | 231/331 [14:12<05:57, 3.57s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████████████████████████████████████████████▊ | 232/331 [14:15<05:46, 3.50s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|█████████████████████████████████████████████████████████ | 233/331 [14:19<06:06, 3.74s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▎ | 234/331 [14:22<05:33, 3.44s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▌ | 235/331 [14:25<05:11, 3.25s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▊ | 236/331 [14:31<06:18, 3.98s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|█████████████████████████████████████████████████████████▉ | 237/331 [14:36<06:46, 4.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▏ | 238/331 [14:40<06:39, 4.30s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▍ | 239/331 [14:44<06:37, 4.33s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▋ | 240/331 [14:49<06:51, 4.52s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▉ | 241/331 [14:55<07:01, 4.69s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▏ | 242/331 [14:59<07:04, 4.77s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▍ | 243/331 [15:04<06:56, 4.74s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▋ | 244/331 [15:09<07:07, 4.92s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▉ | 245/331 [15:14<06:44, 4.70s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|████████████████████████████████████████████████████████████▏ | 246/331 [15:20<07:08, 5.05s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▍ | 247/331 [15:24<06:43, 4.81s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▋ | 248/331 [15:27<06:01, 4.36s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▉ | 249/331 [15:30<05:14, 3.84s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▏ | 250/331 [15:33<04:47, 3.55s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▍ | 251/331 [15:37<04:56, 3.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▋ | 252/331 [15:39<04:30, 3.42s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▉ | 253/331 [15:44<04:53, 3.76s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▏ | 254/331 [15:47<04:39, 3.63s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▍ | 255/331 [15:52<04:55, 3.88s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▋ | 256/331 [15:55<04:38, 3.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|██████████████████████████████████████████████████████████████▉ | 257/331 [16:00<04:51, 3.94s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▏ | 258/331 [16:02<04:19, 3.55s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▍ | 259/331 [16:06<04:11, 3.50s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▋ | 260/331 [16:10<04:20, 3.67s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▊ | 261/331 [16:12<03:51, 3.30s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████ | 262/331 [16:16<03:50, 3.35s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████▎ | 263/331 [16:20<04:12, 3.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▌ | 264/331 [16:23<03:56, 3.53s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [16:26<03:44, 3.41s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|█████████████████████████████████████████████████████████████████ | 266/331 [16:29<03:34, 3.30s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▎ | 267/331 [16:34<03:55, 3.68s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▌ | 268/331 [16:38<03:49, 3.65s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▊ | 269/331 [16:43<04:14, 4.10s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████ | 270/331 [16:47<04:05, 4.02s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▎ | 271/331 [16:52<04:18, 4.32s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▌ | 272/331 [16:55<03:57, 4.03s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [16:59<03:57, 4.09s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████ | 274/331 [17:04<04:12, 4.43s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▎ | 275/331 [17:09<04:10, 4.48s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▌ | 276/331 [17:12<03:43, 4.06s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|███████████████████████████████████████████████████████████████████▊ | 277/331 [17:16<03:31, 3.91s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████ | 278/331 [17:19<03:22, 3.83s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████▎ | 279/331 [17:25<03:49, 4.41s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▌ | 280/331 [17:29<03:36, 4.24s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▊ | 281/331 [17:34<03:43, 4.47s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████ | 282/331 [17:38<03:37, 4.43s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████▎ | 283/331 [17:43<03:42, 4.63s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▍ | 284/331 [17:49<03:47, 4.84s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▋ | 285/331 [17:54<03:47, 4.94s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▉ | 286/331 [17:59<03:45, 5.01s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▏ | 287/331 [18:05<03:50, 5.23s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▍ | 288/331 [18:10<03:44, 5.21s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [18:13<03:18, 4.73s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|██████████████████████████████████████████████████████████████████████▉ | 290/331 [18:17<02:57, 4.32s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▏ | 291/331 [18:20<02:37, 3.93s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▍ | 292/331 [18:23<02:26, 3.75s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▋ | 293/331 [18:27<02:21, 3.74s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▉ | 294/331 [18:30<02:07, 3.44s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▏ | 295/331 [18:33<01:57, 3.27s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▍ | 296/331 [18:35<01:47, 3.07s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▋ | 297/331 [18:40<02:06, 3.73s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▉ | 298/331 [18:46<02:19, 4.22s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [18:49<02:07, 3.98s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [18:49<02:07, 3.98s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [18:49<02:07, 3.98s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▋ | 301/331 [18:57<01:55, 3.83s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▉ | 302/331 [19:00<01:46, 3.68s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▏ | 303/331 [19:03<01:37, 3.47s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▍ | 304/331 [19:07<01:40, 3.71s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▋ | 305/331 [19:12<01:42, 3.96s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▉ | 306/331 [19:17<01:49, 4.36s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▏ | 307/331 [19:22<01:52, 4.67s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▎ | 308/331 [19:28<01:54, 4.99s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▌ | 309/331 [19:33<01:52, 5.10s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|███████████████████████████████████████████████████████████████████████████▊ | 310/331 [19:37<01:35, 4.57s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|█████████��██████████████████████████████████████████████████████████████████ | 311/331 [19:41<01:31, 4.55s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████▎ | 312/331 [19:44<01:17, 4.09s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▌ | 313/331 [19:48<01:10, 3.92s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▊ | 314/331 [19:52<01:09, 4.07s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████ | 315/331 [19:57<01:07, 4.24s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████▎ | 316/331 [20:01<01:04, 4.29s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████████████████████████████████████████████████████████████████████████▌ | 317/331 [20:07<01:04, 4.59s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████████████████████████████████████████████████████████████████████████▊ | 318/331 [20:10<00:53, 4.15s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|██████████████████████████████████████████████████████████████████████████████ | 319/331 [20:13<00:45, 3.82s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▎ | 320/331 [20:17<00:43, 3.93s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▌ | 321/331 [20:21<00:38, 3.86s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▊ | 322/331 [20:26<00:38, 4.24s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████ | 323/331 [20:29<00:32, 4.04s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [20:34<00:30, 4.35s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▌ | 325/331 [20:39<00:26, 4.38s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▊ | 326/331 [20:43<00:22, 4.43s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████ | 327/331 [20:48<00:17, 4.43s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|██████████████████████████████████████████████████████████��█████████████████████▎| 328/331 [20:53<00:13, 4.53s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████▌| 329/331 [20:57<00:08, 4.37s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +100%|████████████████████████████████████████████████████████████████████████████████▊| 330/331 [21:02<00:04, 4.67s/it][INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|configuration_utils.py:438] 2022-03-17 21:16:01,629 >> Configuration saved in ./checkpoint-2500/config.json [INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|configuration_utils.py:438] 2022-03-17 21:16:01,629 >> Configuration saved in ./checkpoint-2500/config.json [INFO|trainer.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/17/2022 21:16:01 - INFO - datasets.metric - Removing /home/sanchit_huggingface_co/.cache/huggingface/metrics/wer/default/default_experiment-1-0.arrow +[INFO|feature_extraction_utils.py:324] 2022-03-17 21:16:06,468 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-17 21:16:06,468 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-17 21:16:06,468 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-17 20:54:54,130 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/17/2022 21:16:26 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20220317_164114-2vzd8l55/run-2vzd8l55.wandb']. This may take a bit of time if the files are large.