diff --git "a/wandb/run-20220318_085758-21ccfwts/files/output.log" "b/wandb/run-20220318_085758-21ccfwts/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20220318_085758-21ccfwts/files/output.log" @@ -0,0 +1,10009 @@ + + + 0%| | 0/17840 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:03,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:05,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4762, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:07,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 1/17840 [00:08<41:04:26, 8.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:58:09,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:11,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:13,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:15,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 2/17840 [00:16<39:24:47, 7.95s/it] + + 0%| | 2/17840 [00:16<39:24:47, 7.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:58:17,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:19,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:20,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:22,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 3/17840 [00:23<38:21:55, 7.74s/it] + + 0%| | 3/17840 [00:23<38:21:55, 7.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:58:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:26,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:28,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:30,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 4/17840 [00:30<37:31:45, 7.57s/it] + + 0%| | 4/17840 [00:30<37:31:45, 7.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:58:31,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:33,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:35,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:37,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 5/17840 [00:38<36:57:47, 7.46s/it] + + 0%| | 5/17840 [00:38<36:57:47, 7.46s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:58:39,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:41,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:42,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3832, 'learning_rate': 5.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:44,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 6/17840 [00:45<36:47:04, 7.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:58:46,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:48,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:50,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4092, 'learning_rate': 6.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:51,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 7/17840 [00:52<36:27:03, 7.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:58:53,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:55,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:57,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3223, 'learning_rate': 6.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-18 08:58:59,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 8/17840 [00:59<36:08:23, 7.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:00,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:02,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:04,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.5404, 'learning_rate': 7.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:06,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 9/17840 [01:06<35:52:26, 7.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:08,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:09,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:11,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4736, 'learning_rate': 8.000000000000001e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:13,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 10/17840 [01:14<35:37:02, 7.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:15,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:16,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:18,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:20,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 11/17840 [01:20<35:14:54, 7.12s/it] + + 0%| | 11/17840 [01:20<35:14:54, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:22,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:23,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:25,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4477, 'learning_rate': 1.0000000000000002e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:27,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 12/17840 [01:27<34:58:43, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:28,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:30,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:32,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:34,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 13/17840 [01:34<34:45:34, 7.02s/it] + + 0%| | 13/17840 [01:34<34:45:34, 7.02s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:35,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:37,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:39,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2868, 'learning_rate': 1.2000000000000002e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:40,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 14/17840 [01:41<34:30:20, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:42,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:44,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:46,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2492, 'learning_rate': 1.3e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:47,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 15/17840 [01:48<34:16:56, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:49,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:51,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:52,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:54,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 16/17840 [01:55<34:00:13, 6.87s/it] + + 0%| | 16/17840 [01:55<34:00:13, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 08:59:56,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:57,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 08:59:59,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:01,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3069, 'learning_rate': 1.5e-06, 'epoch': 0.02} + 0%| | 17/17840 [02:01<33:45:23, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:02,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:04,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:06,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4547, 'learning_rate': 1.6000000000000001e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:07,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 18/17840 [02:08<33:29:19, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:09,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:11,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:12,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1389, 'learning_rate': 1.7000000000000002e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:14,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 19/17840 [02:15<33:21:31, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:16,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:17,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:19,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:21,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 20/17840 [02:21<33:13:04, 6.71s/it] + + 0%| | 20/17840 [02:21<33:13:04, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:22,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:24,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:26,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:27,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1764, 'learning_rate': 1.9e-06, 'epoch': 0.02} + 0%| | 21/17840 [02:28<32:58:59, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:29,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:30,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:32,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1739, 'learning_rate': 2.0000000000000003e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:34,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 22/17840 [02:34<32:43:28, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:35,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:37,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:38,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1839, 'learning_rate': 2.1000000000000002e-06, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:40,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 23/17840 [02:41<32:25:14, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:42,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:43,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:45,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2356, 'learning_rate': 2.2e-06, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:46,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 24/17840 [02:47<32:12:15, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:48,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:50,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:51,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:53,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 25/17840 [02:54<32:41:15, 6.61s/it] + 0%| | 25/17840 [02:54<32:41:15, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:00:55,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:58,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:00:55,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:00:58,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:00:55,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:00,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 26/17840 [03:00<32:21:33, 6.54s/it] + 0%| | 26/17840 [03:00<32:21:33, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:01,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 26/17840 [03:00<32:21:33, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:01,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:07<31:55:14, 6.45s/it]g-point operations will not be computed-18 09:01:01,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:07<31:55:14, 6.45s/it]g-point operations will not be computed-18 09:01:01,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:07<31:55:14, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:08,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [03:07<31:55:14, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:08,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:13<31:31:10, 6.37s/it]g-point operations will not be computed-18 09:01:08,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:13<31:31:10, 6.37s/it]g-point operations will not be computed-18 09:01:08,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:13<31:31:10, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:14,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [03:13<31:31:10, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:14,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:19<31:14:45, 6.32s/it]g-point operations will not be computed-18 09:01:14,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:19<31:14:45, 6.32s/it]g-point operations will not be computed-18 09:01:14,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:19<31:14:45, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:20,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:19<31:14:45, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:20,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:25<30:59:49, 6.27s/it]g-point operations will not be computed-18 09:01:20,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:25<30:59:49, 6.27s/it]g-point operations will not be computed-18 09:01:20,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:25<30:59:49, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:26,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:25<30:59:49, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:26,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:25<30:59:49, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:26,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:31<30:49:53, 6.23s/it]g-point operations will not be computed-18 09:01:26,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:31<30:49:53, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:32,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:35,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:01:32,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:35,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:01:32,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:37<30:23:07, 6.14s/it]g-point operations will not be computed-18 09:01:32,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:37<30:23:07, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:38,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:41,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:01:38,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:41,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:01:38,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:43<30:02:51, 6.07s/it]g-point operations will not be computed-18 09:01:38,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:43<30:02:51, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:44,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:47,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:01:44,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:47,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:01:44,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [03:49<29:25:14, 5.95s/it]g-point operations will not be computed-18 09:01:44,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [03:49<29:25:14, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:50,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:52,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:01:50,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:01:52,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:01:50,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [03:55<28:55:50, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:55,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [03:55<28:55:50, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:01:55,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:00<28:28:52, 5.76s/it]g-point operations will not be computed-18 09:01:55,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:00<28:28:52, 5.76s/it]g-point operations will not be computed-18 09:01:55,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [04:00<28:28:52, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:03,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:03,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:06<28:00:33, 5.66s/it]g-point operations will not be computed-18 09:02:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [04:06<28:00:33, 5.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:06,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:02:06,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:02:06,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [04:11<27:24:25, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:11,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:14,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:11,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:14,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:11,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:16<26:49:37, 5.43s/it]g-point operations will not be computed-18 09:02:11,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [04:16<26:49:37, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:16,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:16,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:19,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:16,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:21<26:12:57, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:21,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:24,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:21,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:24,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:21,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:26<25:28:10, 5.15s/it]g-point operations will not be computed-18 09:02:21,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:26<25:28:10, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:26,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:26<25:28:10, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:26,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 42/17840 [04:30<24:30:51, 4.96s/it]g-point operations will not be computed-18 09:02:26,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:33,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:31,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:33,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:31,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 43/17840 [04:34<23:23:38, 4.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:35,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:37,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:35,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:37,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:35,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:38<22:08:36, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:39,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:40,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:39,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:40,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:39,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 45/17840 [04:42<20:37:07, 4.17s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:42,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:45<19:06:18, 3.87s/it]g-point operations will not be computed-18 09:02:42,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:45<19:06:18, 3.87s/it]g-point operations will not be computed-18 09:02:42,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:46,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:45,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:02:46,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:45,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 47/17840 [04:48<17:34:20, 3.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:48,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 47/17840 [04:48<17:34:20, 3.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:48,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 48/17840 [04:50<16:01:36, 3.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:50,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 48/17840 [04:50<16:01:36, 3.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:50,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 49/17840 [04:53<14:33:01, 2.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:52,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:55<13:57:19, 2.82s/it]g-point operations will not be computed-18 09:02:52,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:55<13:57:19, 2.82s/it]g-point operations will not be computed-18 09:02:52,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:55<13:57:19, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:56,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:55<13:57:19, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:02:56,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:00,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:02:56,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:03<21:09:32, 4.28s/it]g-point operations will not be computed-18 09:02:56,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:03<21:09:32, 4.28s/it]g-point operations will not be computed-18 09:02:56,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:03<21:09:32, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:04,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [05:03<21:09:32, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:04,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:03:04,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:08,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:03:04,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:10<25:47:38, 5.22s/it]g-point operations will not be computed-18 09:03:04,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:10<25:47:38, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:11,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [05:10<25:47:38, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:11,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:18<29:02:32, 5.88s/it]g-point operations will not be computed-18 09:03:11,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:18<29:02:32, 5.88s/it]g-point operations will not be computed-18 09:03:11,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:18<29:02:32, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:19,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [05:18<29:02:32, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:19,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:22,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:03:19,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:22,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:03:19,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:25<31:01:47, 6.28s/it]g-point operations will not be computed-18 09:03:19,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:25<31:01:47, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:26,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [05:25<31:01:47, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:26,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:03:26,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:03:26,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:32<32:24:59, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:33,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:32<32:24:59, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:33,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:37,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:03:33,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:39<33:22:48, 6.76s/it]g-point operations will not be computed-18 09:03:33,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:39<33:22:48, 6.76s/it]g-point operations will not be computed-18 09:03:33,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:39<33:22:48, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:40,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:39<33:22:48, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:40,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:44,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:03:40,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:44,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:03:40,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:46<33:56:44, 6.87s/it]g-point operations will not be computed-18 09:03:40,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:46<33:56:44, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:47,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:03:51,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:03:47,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:54<34:22:11, 6.96s/it]g-point operations will not be computed-18 09:03:47,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:54<34:22:11, 6.96s/it]g-point operations will not be computed-18 09:03:47,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:54<34:22:11, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:55,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:54<34:22:11, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:03:55,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:01<34:26:31, 6.97s/it]g-point operations will not be computed-18 09:03:55,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:01<34:26:31, 6.97s/it]g-point operations will not be computed-18 09:03:55,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:01<34:26:31, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:02,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [06:01<34:26:31, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:02,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:04:05,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:02,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:08<34:34:32, 7.00s/it]g-point operations will not be computed-18 09:04:02,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:08<34:34:32, 7.00s/it]g-point operations will not be computed-18 09:04:02,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:08<34:34:32, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:09,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [06:08<34:34:32, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:09,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:15<34:33:08, 7.00s/it]g-point operations will not be computed-18 09:04:09,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:15<34:33:08, 7.00s/it]g-point operations will not be computed-18 09:04:09,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:15<34:33:08, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:16,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [06:15<34:33:08, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:16,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:04:19,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:16,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:04:19,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:16,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:21<34:23:34, 6.96s/it]g-point operations will not be computed-18 09:04:16,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [06:21<34:23:34, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:22,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:04:26,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:22,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:28<34:12:26, 6.93s/it]g-point operations will not be computed-18 09:04:22,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:28<34:12:26, 6.93s/it]g-point operations will not be computed-18 09:04:22,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:28<34:12:26, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:29,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [06:28<34:12:26, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:29,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:35<34:02:31, 6.89s/it]g-point operations will not be computed-18 09:04:29,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:35<34:02:31, 6.89s/it]g-point operations will not be computed-18 09:04:29,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:35<34:02:31, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:36,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:35<34:02:31, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:36,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:04:40,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:36,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:04:40,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:36,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:42<33:58:24, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:43,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:42<33:58:24, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:43,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:04:46,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:43,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:49<33:39:07, 6.82s/it]g-point operations will not be computed-18 09:04:43,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:49<33:39:07, 6.82s/it]g-point operations will not be computed-18 09:04:43,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:49<33:39:07, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:50,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:49<33:39:07, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:50,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:55<33:29:44, 6.78s/it]g-point operations will not be computed-18 09:04:50,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:55<33:29:44, 6.78s/it]g-point operations will not be computed-18 09:04:50,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:55<33:29:44, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:56,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:55<33:29:44, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:04:56,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:05:00,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:56,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:05:00,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:04:56,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:02<33:14:21, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:03,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [07:02<33:14:21, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:03,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:05:06,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:05:03,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:09<33:02:19, 6.69s/it]g-point operations will not be computed-18 09:05:03,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:09<33:02:19, 6.69s/it]g-point operations will not be computed-18 09:05:03,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [07:09<33:02:19, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:10,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:05:13,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:05:10,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:15<32:54:54, 6.67s/it]g-point operations will not be computed-18 09:05:10,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:15<32:54:54, 6.67s/it]g-point operations will not be computed-18 09:05:10,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [07:15<32:54:54, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:16,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:05:19,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:05:16,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:22<32:44:52, 6.63s/it]g-point operations will not be computed-18 09:05:16,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:22<32:44:52, 6.63s/it]g-point operations will not be computed-18 09:05:16,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:22<32:44:52, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:23,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [07:22<32:44:52, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:23,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:28<32:39:12, 6.62s/it]g-point operations will not be computed-18 09:05:23,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:28<32:39:12, 6.62s/it]g-point operations will not be computed-18 09:05:23,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:28<32:39:12, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:29,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [07:28<32:39:12, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:29,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:05:29,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:05:29,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:35<32:27:22, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:36,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [07:35<32:27:22, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:36,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:05:39,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:05:36,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:41<32:26:39, 6.57s/it]g-point operations will not be computed-18 09:05:36,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:41<32:26:39, 6.57s/it]g-point operations will not be computed-18 09:05:36,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:41<32:26:39, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:42,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:05:45,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:05:42,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:48<32:57:04, 6.68s/it]g-point operations will not be computed-18 09:05:42,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:48<32:57:04, 6.68s/it]g-point operations will not be computed-18 09:05:42,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:48<32:57:04, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:49,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:48<32:57:04, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:49,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:55<32:22:32, 6.56s/it]g-point operations will not be computed-18 09:05:49,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:55<32:22:32, 6.56s/it]g-point operations will not be computed-18 09:05:49,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:55<32:22:32, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:55,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:55<32:22:32, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:55,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:55<32:22:32, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:05:55,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:01<31:58:28, 6.48s/it]g-point operations will not be computed-18 09:05:55,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:01<31:58:28, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:02,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:01<31:58:28, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:02,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [08:01<31:58:28, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:02,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:07<31:37:21, 6.41s/it]g-point operations will not be computed-18 09:06:02,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:07<31:37:21, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:08,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:07<31:37:21, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:08,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [08:07<31:37:21, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:08,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:13<31:14:56, 6.33s/it]g-point operations will not be computed-18 09:06:08,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:13<31:14:56, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:14,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:13<31:14:56, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:14,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [08:13<31:14:56, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:14,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:19<30:52:33, 6.26s/it]g-point operations will not be computed-18 09:06:14,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:19<30:52:33, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:20,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:19<30:52:33, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:20,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [08:19<30:52:33, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:20,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:25<30:30:25, 6.18s/it]g-point operations will not be computed-18 09:06:20,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [08:25<30:30:25, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:29,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:29,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:31<30:08:34, 6.11s/it]g-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [08:31<30:08:34, 6.11s/it]g-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:35,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:35,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [08:37<29:51:42, 6.05s/it]g-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:39,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:39,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:39,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:26,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 84/17840 [08:43<29:23:30, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:44,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 84/17840 [08:43<29:23:30, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:44,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 84/17840 [08:43<29:23:30, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:44,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 84/17840 [08:43<29:23:30, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:44,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 85/17840 [08:49<29:00:58, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 85/17840 [08:49<29:00:58, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:53,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:53,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4799, 'learning_rate': 8.3e-06, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:53,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:53,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:06:59,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:06:49,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 88/17840 [09:05<27:31:47, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:07:06,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 88/17840 [09:05<27:31:47, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:07:06,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:09,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:06,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:09,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:06,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:12,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:06,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:12,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:06,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:12,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:06,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 90/17840 [09:15<26:14:24, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:18,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:18,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 91/17840 [09:20<25:19:57, 5.14s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:21,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:21,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:24,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:26,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:28,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:28,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:30,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:30,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:32,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:34,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:34,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:35,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:37,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:37,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:40,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:40,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:41,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:44,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:44,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:45,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:45,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:48,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:48,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:49,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:49,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:53,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:53,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:53,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:57,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:07:57,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:01,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:04,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:04,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3849, 'learning_rate': 9.900000000000002e-06, 'epoch': 0.11} +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:04,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:04,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:04,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:12<29:06:16, 5.91s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:12<29:06:16, 5.91s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [10:12<29:06:16, 5.91s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:19,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:19,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4163, 'learning_rate': 1.0100000000000002e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:19,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:19,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:27<32:36:36, 6.62s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [10:27<32:36:36, 6.62s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2648, 'learning_rate': 1.02e-05, 'epoch': 0.12} + 1%|▍ | 105/17840 [10:27<32:36:36, 6.62s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:33,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:33,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.519, 'learning_rate': 1.03e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:33,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:33,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [10:41<33:47:30, 6.86s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [10:41<33:47:30, 6.86s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5189, 'learning_rate': 1.04e-05, 'epoch': 0.12} + 1%|▍ | 107/17840 [10:41<33:47:30, 6.86s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:47,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:47,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6217, 'learning_rate': 1.05e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:47,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:47,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:08:47,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [10:55<34:20:33, 6.97s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [10:55<34:20:33, 6.97s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:00,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:02<34:21:17, 6.98s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:02<34:21:17, 6.98s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.363, 'learning_rate': 1.0700000000000001e-05, 'epoch': 0.12} + 1%|▍ | 110/17840 [11:02<34:21:17, 6.98s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:02<34:21:17, 6.98s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [11:02<34:21:17, 6.98s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 111/17840 [11:09<34:13:01, 6.95s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:12,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:12,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:16<34:07:50, 6.93s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [11:16<34:07:50, 6.93s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3798, 'learning_rate': 1.09e-05, 'epoch': 0.13} + 1%|▍ | 112/17840 [11:16<34:07:50, 6.93s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:22,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:22,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3549, 'learning_rate': 1.1000000000000001e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:22,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:22,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [11:30<33:55:19, 6.89s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [11:30<33:55:19, 6.89s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:32,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:32,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 115/17840 [11:37<33:43:21, 6.85s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 115/17840 [11:37<33:43:21, 6.85s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3745, 'learning_rate': 1.1200000000000001e-05, 'epoch': 0.13} + 1%|▍ | 115/17840 [11:37<33:43:21, 6.85s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:42,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:42,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1432, 'learning_rate': 1.13e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:42,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:49,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:49,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:49,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4495, 'learning_rate': 1.1400000000000001e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:49,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [11:57<33:04:01, 6.72s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [11:57<33:04:01, 6.72s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:59,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:09:59,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [12:03<32:48:58, 6.67s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [12:03<32:48:58, 6.67s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.499, 'learning_rate': 1.16e-05, 'epoch': 0.13} + 1%|▌ | 119/17840 [12:03<32:48:58, 6.67s/it]g-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:09,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:09,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5266, 'learning_rate': 1.1700000000000001e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:09,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:15,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:15,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4672, 'learning_rate': 1.18e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:15,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:15,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:07:16,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 122/17840 [12:23<32:16:55, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:24,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 122/17840 [12:23<32:16:55, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:24,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3615, 'learning_rate': 1.19e-05, 'epoch': 0.14} + 1%|▌ | 122/17840 [12:23<32:16:55, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:24,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [12:29<32:06:12, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:24,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [12:29<32:06:12, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:24,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:32,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:24,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:32,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:24,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:32,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:24,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [12:35<31:52:57, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [12:35<31:52:57, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [12:35<31:52:57, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [12:35<31:52:57, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [12:42<32:21:13, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [12:42<32:21:13, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:46,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:46,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [12:49<31:58:46, 6.50s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [12:49<31:58:46, 6.50s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:52,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:52,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [12:55<31:35:33, 6.42s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [12:55<31:35:33, 6.42s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:59,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:10:59,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 128/17840 [13:01<31:10:16, 6.34s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 128/17840 [13:01<31:10:16, 6.34s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:05,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:05,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 129/17840 [13:07<30:50:57, 6.27s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 129/17840 [13:07<30:50:57, 6.27s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:11,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:11,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 130/17840 [13:13<30:27:13, 6.19s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 130/17840 [13:13<30:27:13, 6.19s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:17,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:17,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 131/17840 [13:19<30:09:01, 6.13s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:21,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:21,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:21,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [13:25<29:50:16, 6.07s/it]g-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:27,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:27,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:27,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:10:36,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 133/17840 [13:31<29:28:18, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:11:32,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 133/17840 [13:31<29:28:18, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:11:32,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:36,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:32,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:36,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:32,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4808, 'learning_rate': 1.3100000000000002e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:36,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:32,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:41,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:32,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:41,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:32,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3239, 'learning_rate': 1.32e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:45,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:32,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 136/17840 [13:48<28:05:18, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:11:48,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 136/17840 [13:48<28:05:18, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:11:48,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3337, 'learning_rate': 1.3300000000000001e-05, 'epoch': 0.15} + 1%|▌ | 136/17840 [13:48<28:05:18, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:11:48,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 136/17840 [13:48<28:05:18, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:11:48,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 137/17840 [13:53<27:35:58, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:11:54,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 137/17840 [13:53<27:35:58, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:11:54,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:54,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:11:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:54,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:00,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:54,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:00,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:54,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:00,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:11:54,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 139/17840 [14:03<26:24:48, 5.37s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:06,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 140/17840 [14:08<25:34:58, 5.20s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 140/17840 [14:08<25:34:58, 5.20s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:10,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:14,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:16,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:16,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:18,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:20,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:20,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:22,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:23,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:23,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:27,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:27,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:28,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:30,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:30,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:32,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:32,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:34,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:34,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:36,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:36,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:38,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:40,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:40,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3485, 'learning_rate': 1.47e-05, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:44,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:44,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:47,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:47,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:51,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:51,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:55,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:55,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3669, 'learning_rate': 1.49e-05, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:59,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:12:59,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 153/17840 [15:03<28:27:45, 5.79s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 153/17840 [15:03<28:27:45, 5.79s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4344, 'learning_rate': 1.5e-05, 'epoch': 0.17} + 1%|▋ | 153/17840 [15:03<28:27:45, 5.79s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 153/17840 [15:03<28:27:45, 5.79s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:09,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:09,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:09,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:09,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:09,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [15:17<32:01:27, 6.52s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [15:17<32:01:27, 6.52s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:22,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:24<32:54:44, 6.70s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:24<32:54:44, 6.70s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2929, 'learning_rate': 1.53e-05, 'epoch': 0.17} + 1%|▋ | 156/17840 [15:24<32:54:44, 6.70s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:24<32:54:44, 6.70s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [15:24<32:54:44, 6.70s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [15:31<33:27:21, 6.81s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:34,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:34,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:34,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [15:39<33:52:50, 6.90s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [15:39<33:52:50, 6.90s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [15:39<33:52:50, 6.90s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:45,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:45,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6063, 'learning_rate': 1.56e-05, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:45,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:45,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:45,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [15:53<34:06:07, 6.94s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [15:53<34:06:07, 6.94s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [15:53<34:06:07, 6.94s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [15:53<34:06:07, 6.94s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:59,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:59,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:59,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:59,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:13:59,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [16:06<33:52:41, 6.90s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:09,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:09,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:09,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:13<33:46:09, 6.88s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [16:13<33:46:09, 6.88s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:17,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:20<33:39:55, 6.86s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:20<33:39:55, 6.86s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4848, 'learning_rate': 1.6100000000000002e-05, 'epoch': 0.18} + 1%|▋ | 164/17840 [16:20<33:39:55, 6.86s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:20<33:39:55, 6.86s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [16:20<33:39:55, 6.86s/it]g-point operations will not be computed-18 09:12:04,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 165/17840 [16:27<33:29:57, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 165/17840 [16:27<33:29:57, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 165/17840 [16:27<33:29:57, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 165/17840 [16:27<33:29:57, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [16:33<33:18:06, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [16:33<33:18:06, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:38,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:38,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [16:40<33:06:19, 6.74s/it]g-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [16:40<33:06:19, 6.74s/it]g-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [16:40<33:06:19, 6.74s/it]g-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:46,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:46,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1642, 'learning_rate': 1.65e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:46,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:52,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:52,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.179, 'learning_rate': 1.66e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:52,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:52,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:14:52,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:14:28,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [17:00<32:24:37, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [17:00<32:24:37, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [17:00<32:24:37, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [17:00<32:24:37, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:06<32:09:50, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 171/17840 [17:06<32:09:50, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:10,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:10,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 172/17840 [17:13<32:03:00, 6.53s/it]g-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 172/17840 [17:13<32:03:00, 6.53s/it]g-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:17,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [17:19<31:50:23, 6.49s/it]g-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [17:19<31:50:23, 6.49s/it]g-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4037, 'learning_rate': 1.7000000000000003e-05, 'epoch': 0.19} + 1%|▋ | 173/17840 [17:19<31:50:23, 6.49s/it]g-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:24,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:24,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2218, 'learning_rate': 1.7100000000000002e-05, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:24,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:24,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:24,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:00,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [17:32<32:06:30, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:33,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [17:32<32:06:30, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:33,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [17:32<32:06:30, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:33,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [17:32<32:06:30, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:33,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [17:38<31:50:27, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:33,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:41,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:33,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:41,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:33,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:41,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:33,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [17:45<31:22:07, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [17:45<31:22:07, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [17:45<31:22:07, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [17:45<31:22:07, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 178/17840 [17:51<31:02:23, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:53,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:53,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:15:53,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:45,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [17:57<30:45:31, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:58,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [17:57<30:45:31, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:58,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [17:57<30:45:31, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:58,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [17:57<30:45:31, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:58,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 180/17840 [18:03<30:27:35, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:15:58,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:05,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:58,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:05,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:58,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:05,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:15:58,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 181/17840 [18:09<30:04:08, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:10,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 181/17840 [18:09<30:04:08, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:10,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 181/17840 [18:09<30:04:08, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:10,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 181/17840 [18:09<30:04:08, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:10,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [18:15<29:43:51, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [18:15<29:43:51, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:20,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:20,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4535, 'learning_rate': 1.8e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:24,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 184/17840 [18:26<28:49:24, 5.88s/it]g-point operations will not be computed-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 184/17840 [18:26<28:49:24, 5.88s/it]g-point operations will not be computed-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:28,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:28,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:15,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 185/17840 [18:32<28:20:26, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 185/17840 [18:32<28:20:26, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4215, 'learning_rate': 1.8200000000000002e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:36,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:36,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3083, 'learning_rate': 1.83e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:40,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 187/17840 [18:43<27:23:37, 5.59s/it]g-point operations will not be computed-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 187/17840 [18:43<27:23:37, 5.59s/it]g-point operations will not be computed-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:45,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:45,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:45,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 188/17840 [18:48<26:56:14, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:48,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 188/17840 [18:48<26:56:14, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:48,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:52,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:48,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:52,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:48,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3384, 'learning_rate': 1.86e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-18 09:16:56,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:48,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 190/17840 [18:58<25:46:19, 5.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 190/17840 [18:58<25:46:19, 5.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.445, 'learning_rate': 1.87e-05, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:02,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:02,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:04,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:06,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:06,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:08,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:11,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:11,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:13,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:14,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:14,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:16,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:21,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:21,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:23,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:24,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:24,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:26,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:26,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:29,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:29,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:31,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:31,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7835, 'learning_rate': 1.97e-05, 'epoch': 0.22} +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:35,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:35,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:39,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:39,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1689, 'learning_rate': 1.9800000000000004e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:42,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:42,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:46,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:46,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3166, 'learning_rate': 1.9900000000000003e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:46,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:54,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:54,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2096, 'learning_rate': 2e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:54,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:54,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:17:54,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:02<30:43:33, 6.27s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:02<30:43:33, 6.27s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 204/17840 [20:02<30:43:33, 6.27s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:08,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:08,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1205, 'learning_rate': 2.0200000000000003e-05, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:08,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:08,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:08,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [20:16<32:53:56, 6.72s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [20:16<32:53:56, 6.72s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:20,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [20:23<33:22:01, 6.81s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [20:23<33:22:01, 6.81s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.252, 'learning_rate': 2.04e-05, 'epoch': 0.23} + 1%|▉ | 207/17840 [20:23<33:22:01, 6.81s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [20:23<33:22:01, 6.81s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [20:23<33:22:01, 6.81s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 208/17840 [20:30<33:40:18, 6.87s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:33,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:33,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:33,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [20:37<33:45:30, 6.89s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [20:37<33:45:30, 6.89s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [20:37<33:45:30, 6.89s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [20:37<33:45:30, 6.89s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [20:37<33:45:30, 6.89s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [20:44<33:47:20, 6.90s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:46,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:46,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:46,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [20:51<33:40:06, 6.88s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [20:51<33:40:06, 6.88s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:18:55,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3207, 'learning_rate': 2.09e-05, 'epoch': 0.24} + g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 213/17840 [21:04<33:29:30, 6.84s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:07,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:07,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:07,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [21:11<33:23:09, 6.82s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [21:11<33:23:09, 6.82s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [21:11<33:23:09, 6.82s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [21:11<33:23:09, 6.82s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:17,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:17,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:17,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:23,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:23,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3812, 'learning_rate': 2.13e-05, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:23,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:23,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:23,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 217/17840 [21:31<33:01:14, 6.75s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 217/17840 [21:31<33:01:14, 6.75s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:35,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:35,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [21:38<32:53:53, 6.72s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [21:38<32:53:53, 6.72s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [21:38<32:53:53, 6.72s/it]g-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:43,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:43,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3362, 'learning_rate': 2.16e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:43,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:43,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:19:43,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:16:58,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [21:51<32:20:11, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [21:51<32:20:11, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [21:51<32:20:11, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [21:51<32:20:11, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [21:57<32:08:51, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:00,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:00,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:00,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 222/17840 [22:04<32:02:43, 6.55s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 222/17840 [22:04<32:02:43, 6.55s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:08,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:08,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [22:10<31:57:47, 6.53s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 223/17840 [22:10<31:57:47, 6.53s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:14,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [22:17<31:42:55, 6.48s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 224/17840 [22:17<31:42:55, 6.48s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3063, 'learning_rate': 2.2100000000000002e-05, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:20,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [22:23<32:07:08, 6.56s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [22:23<32:07:08, 6.56s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4005, 'learning_rate': 2.22e-05, 'epoch': 0.25} + 1%|▉ | 225/17840 [22:23<32:07:08, 6.56s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [22:23<32:07:08, 6.56s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [22:23<32:07:08, 6.56s/it]g-point operations will not be computed-18 09:19:52,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [22:30<31:42:45, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:30,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [22:30<31:42:45, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:30,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [22:30<31:42:45, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:30,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [22:30<31:42:45, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:30,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 227/17840 [22:36<31:14:12, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 227/17840 [22:36<31:14:12, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 227/17840 [22:36<31:14:12, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 227/17840 [22:36<31:14:12, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:37,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 228/17840 [22:42<30:52:31, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 228/17840 [22:42<30:52:31, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:47,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:47,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2616, 'learning_rate': 2.26e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:47,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:53,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:53,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2935, 'learning_rate': 2.2700000000000003e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:53,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:59,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:59,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2881, 'learning_rate': 2.2800000000000002e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-18 09:20:59,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:05,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:05,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3952, 'learning_rate': 2.29e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:05,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:11,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:11,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:14,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:14,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 234/17840 [23:17<28:53:58, 5.91s/it]g-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 234/17840 [23:17<28:53:58, 5.91s/it]g-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:19,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:19,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:19,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:20:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 235/17840 [23:23<28:25:40, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 235/17840 [23:23<28:25:40, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:28,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:28,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3103, 'learning_rate': 2.3300000000000004e-05, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:32,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 237/17840 [23:34<27:29:02, 5.62s/it]g-point operations will not be computed-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 237/17840 [23:34<27:29:02, 5.62s/it]g-point operations will not be computed-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:36,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:36,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:36,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:24,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 238/17840 [23:39<26:54:40, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:21:40,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:42,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:40,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 239/17840 [23:44<26:25:18, 5.40s/it]g-point operations will not be computed-18 09:21:40,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 239/17840 [23:44<26:25:18, 5.40s/it]g-point operations will not be computed-18 09:21:40,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:46,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:40,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:46,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:40,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:46,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:40,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 240/17840 [23:49<25:47:47, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:21:50,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:52,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:50,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 241/17840 [23:54<25:01:41, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 241/17840 [23:54<25:01:41, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4249, 'learning_rate': 2.38e-05, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:58,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:21:58,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:00,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:02,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:02,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:03,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:05,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:05,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:07,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:07,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:10,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:15,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:15,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:16,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:18,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:18,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:20,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:20,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:22,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:22,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.313, 'learning_rate': 2.47e-05, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:26,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:26,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:30,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:30,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4865, 'learning_rate': 2.48e-05, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:33,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:37,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:37,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2066, 'learning_rate': 2.4900000000000002e-05, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:41,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:22:41,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [24:45<28:17:39, 5.79s/it]g-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [24:45<28:17:39, 5.79s/it]g-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1992, 'learning_rate': 2.5e-05, 'epoch': 0.28} + 1%|█ | 253/17840 [24:45<28:17:39, 5.79s/it]g-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [24:45<28:17:39, 5.79s/it]g-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 253/17840 [24:45<28:17:39, 5.79s/it]g-point operations will not be computed-18 09:21:54,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [24:52<30:17:30, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:22:53,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [24:52<30:17:30, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:22:53,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 254/17840 [24:52<30:17:30, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:22:53,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [24:59<31:41:13, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:22:53,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [24:59<31:41:13, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:22:53,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2331, 'learning_rate': 2.5200000000000003e-05, 'epoch': 0.29} + 1%|█ | 255/17840 [24:59<31:41:13, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:22:53,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [24:59<31:41:13, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:22:53,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [24:59<31:41:13, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:22:53,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [25:06<32:33:21, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [25:06<32:33:21, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [25:06<32:33:21, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [25:06<32:33:21, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:13<33:01:44, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:13<33:01:44, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:13<33:01:44, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 257/17840 [25:13<33:01:44, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:20,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:20,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:20,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:20,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:20,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [25:27<33:35:23, 6.88s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:30,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:30,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:30,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [25:34<33:38:44, 6.89s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [25:34<33:38:44, 6.89s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [25:34<33:38:44, 6.89s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:40,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:40,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4041, 'learning_rate': 2.58e-05, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:40,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:40,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:40,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [25:48<33:24:38, 6.84s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:50,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:50,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:23:50,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [25:55<33:18:48, 6.82s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [25:55<33:18:48, 6.82s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [25:55<33:18:48, 6.82s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:01,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:01,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2113, 'learning_rate': 2.61e-05, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:01,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:07,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:07,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3241, 'learning_rate': 2.6200000000000003e-05, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:07,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:07,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:07,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [26:15<32:53:44, 6.74s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [26:15<32:53:44, 6.74s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:19,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:19,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [26:21<32:40:32, 6.69s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [26:21<32:40:32, 6.69s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [26:21<32:40:32, 6.69s/it]g-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:27,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:27,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5262, 'learning_rate': 2.6500000000000004e-05, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:27,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:27,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:27,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:23:07,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [26:34<32:27:15, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [26:34<32:27:15, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [26:34<32:27:15, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [26:34<32:27:15, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 270/17840 [26:41<32:22:51, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:44,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:44,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:44,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 271/17840 [26:48<32:09:30, 6.59s/it]g-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:50,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:50,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 272/17840 [26:54<31:57:10, 6.55s/it]g-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 272/17840 [26:54<31:57:10, 6.55s/it]g-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.217, 'learning_rate': 2.6900000000000003e-05, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-18 09:24:58,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 273/17840 [27:00<31:45:24, 6.51s/it]g-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 273/17840 [27:00<31:45:24, 6.51s/it]g-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2217, 'learning_rate': 2.7000000000000002e-05, 'epoch': 0.31} + 2%|█▏ | 273/17840 [27:00<31:45:24, 6.51s/it]g-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:06,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:06,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1867, 'learning_rate': 2.7100000000000005e-05, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:06,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:06,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:06,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:24:35,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [27:14<32:06:45, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [27:14<32:06:45, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [27:14<32:06:45, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [27:14<32:06:45, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 276/17840 [27:20<31:40:12, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:22,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:22,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:22,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 277/17840 [27:26<31:21:52, 6.43s/it]g-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:29,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:29,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:29,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 278/17840 [27:32<31:02:34, 6.36s/it]g-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:35,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:35,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:35,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 279/17840 [27:39<30:44:36, 6.30s/it]g-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:41,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:41,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:41,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 280/17840 [27:45<30:22:13, 6.23s/it]g-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:47,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:47,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:47,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [27:51<30:06:13, 6.17s/it]g-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:53,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:53,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:25:53,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:15,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 282/17840 [27:57<29:43:49, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 282/17840 [27:57<29:43:49, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:02,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:02,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0814, 'learning_rate': 2.8000000000000003e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:06,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [28:08<28:41:31, 5.88s/it]g-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [28:08<28:41:31, 5.88s/it]g-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:10,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:10,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 285/17840 [28:14<28:12:15, 5.78s/it]g-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 285/17840 [28:14<28:12:15, 5.78s/it]g-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:16,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:18,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:18,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2779, 'learning_rate': 2.83e-05, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:22,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 287/17840 [28:24<27:05:19, 5.56s/it]g-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 287/17840 [28:24<27:05:19, 5.56s/it]g-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:26,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:26,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:25:57,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 288/17840 [28:29<26:29:13, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 288/17840 [28:29<26:29:13, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:32,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 289/17840 [28:34<25:47:15, 5.29s/it]g-point operations will not be computed-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 289/17840 [28:34<25:47:15, 5.29s/it]g-point operations will not be computed-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:36,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:38,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:38,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3931, 'learning_rate': 2.87e-05, 'epoch': 0.33} + 2%|█▏ | 291/17840 [28:44<23:59:29, 4.92s/it]g-point operations will not be computed-18 09:26:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 291/17840 [28:44<23:59:29, 4.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:44,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 291/17840 [28:44<23:59:29, 4.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:44,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:26:46,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:26:44,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 292/17840 [28:48<22:58:49, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:48,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 292/17840 [28:48<22:58:49, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:48,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 293/17840 [28:52<21:54:06, 4.49s/it]g-point operations will not be computed-18 09:26:48,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 293/17840 [28:52<21:54:06, 4.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:52,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 293/17840 [28:52<21:54:06, 4.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:52,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [28:55<20:41:14, 4.24s/it]g-point operations will not be computed-18 09:26:52,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [28:55<20:41:14, 4.24s/it]g-point operations will not be computed-18 09:26:52,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [28:55<20:41:14, 4.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:56,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [28:55<20:41:14, 4.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:56,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 295/17840 [28:59<19:38:25, 4.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:26:59,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 296/17840 [29:02<18:08:30, 3.72s/it]g-point operations will not be computed-18 09:26:59,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 296/17840 [29:02<18:08:30, 3.72s/it]g-point operations will not be computed-18 09:26:59,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:03,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:02,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:03,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:02,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 297/17840 [29:05<16:35:57, 3.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:05,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 297/17840 [29:05<16:35:57, 3.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:05,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 298/17840 [29:07<15:11:21, 3.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:07,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 298/17840 [29:07<15:11:21, 3.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:07,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 299/17840 [29:09<13:45:19, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:09,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [29:12<13:09:13, 2.70s/it]g-point operations will not be computed-18 09:27:09,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [29:12<13:09:13, 2.70s/it]g-point operations will not be computed-18 09:27:09,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [29:12<13:09:13, 2.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:13,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [29:12<13:09:13, 2.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:13,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:17,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:13,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [29:19<20:34:12, 4.22s/it]g-point operations will not be computed-18 09:27:13,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [29:19<20:34:12, 4.22s/it]g-point operations will not be computed-18 09:27:13,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [29:19<20:34:12, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:21,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [29:19<20:34:12, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:21,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:24,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:21,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:27<25:05:08, 5.15s/it]g-point operations will not be computed-18 09:27:21,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:27<25:05:08, 5.15s/it]g-point operations will not be computed-18 09:27:21,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:27<25:05:08, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [29:27<25:05:08, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:33,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:33,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:33,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2136, 'learning_rate': 3e-05, 'epoch': 0.34} +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:33,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [29:41<30:29:36, 6.26s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [29:41<30:29:36, 6.26s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3225, 'learning_rate': 3.01e-05, 'epoch': 0.34} + 2%|█▎ | 304/17840 [29:41<30:29:36, 6.26s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [29:41<30:29:36, 6.26s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [29:48<31:40:27, 6.50s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [29:48<31:40:27, 6.50s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:51,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:27:51,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [29:56<32:36:13, 6.69s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [29:56<32:36:13, 6.69s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2248, 'learning_rate': 3.03e-05, 'epoch': 0.34} + 2%|█▎ | 306/17840 [29:56<32:36:13, 6.69s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [29:56<32:36:13, 6.69s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 306/17840 [29:56<32:36:13, 6.69s/it]g-point operations will not be computed-18 09:27:28,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [30:03<33:08:57, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [30:03<33:08:57, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [30:03<33:08:57, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 307/17840 [30:03<33:08:57, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [30:10<33:28:20, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [30:10<33:28:20, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:14,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:14,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:17<33:30:54, 6.88s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:17<33:30:54, 6.88s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:17<33:30:54, 6.88s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:17<33:30:54, 6.88s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [30:17<33:30:54, 6.88s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [30:24<33:36:06, 6.90s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:26,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:26,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:26,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [30:30<33:27:00, 6.87s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [30:30<33:27:00, 6.87s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [30:30<33:27:00, 6.87s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [30:30<33:27:00, 6.87s/it]g-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:36,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:36,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:36,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:36,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:36,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:04,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [30:44<33:17:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [30:44<33:17:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [30:44<33:17:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [30:44<33:17:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [30:51<33:05:24, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:53,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:53,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:28:53,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [30:57<32:54:25, 6.76s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [30:57<32:54:25, 6.76s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [30:57<32:54:25, 6.76s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:03,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:03,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.33, 'learning_rate': 3.13e-05, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:03,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:10,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:10,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2049, 'learning_rate': 3.1400000000000004e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:10,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:10,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:10,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 318/17840 [31:17<32:25:59, 6.66s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:20,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:20,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:20,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 319/17840 [31:24<32:17:34, 6.64s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 319/17840 [31:24<32:17:34, 6.64s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:28,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:28,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 320/17840 [31:30<32:02:06, 6.58s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 320/17840 [31:30<32:02:06, 6.58s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 320/17840 [31:30<32:02:06, 6.58s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:36,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:36,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3573, 'learning_rate': 3.18e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:36,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:42,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:42,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2707, 'learning_rate': 3.19e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:42,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:49,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:49,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1503, 'learning_rate': 3.2000000000000005e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:49,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:49,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:49,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [31:56<31:23:31, 6.45s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:29:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [32:03<31:52:10, 6.55s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [32:03<31:52:10, 6.55s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.385, 'learning_rate': 3.2200000000000003e-05, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:07,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 326/17840 [32:09<31:30:30, 6.48s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 326/17840 [32:09<31:30:30, 6.48s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3805, 'learning_rate': 3.2300000000000006e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:13,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [32:15<31:08:04, 6.40s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [32:15<31:08:04, 6.40s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2399, 'learning_rate': 3.24e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:19,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [32:21<30:40:17, 6.31s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [32:21<30:40:17, 6.31s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.227, 'learning_rate': 3.2500000000000004e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:25,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 329/17840 [32:27<30:24:36, 6.25s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 329/17840 [32:27<30:24:36, 6.25s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4373, 'learning_rate': 3.26e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:31,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 330/17840 [32:33<30:01:59, 6.17s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 330/17840 [32:33<30:01:59, 6.17s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4642, 'learning_rate': 3.27e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:37,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [32:39<29:38:52, 6.10s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [32:39<29:38:52, 6.10s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2793, 'learning_rate': 3.2800000000000004e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:43,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:43,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 332/17840 [32:45<29:17:29, 6.02s/it]g-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:47,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:47,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:47,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:28:45,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 333/17840 [32:51<28:54:15, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 333/17840 [32:51<28:54:15, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:56,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:56,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3524, 'learning_rate': 3.3100000000000005e-05, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-18 09:30:56,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:01,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:01,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4801, 'learning_rate': 3.32e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:06,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:06,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:30:52,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 336/17840 [33:08<27:39:07, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 336/17840 [33:08<27:39:07, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:12,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:12,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1642, 'learning_rate': 3.3400000000000005e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:16,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 338/17840 [33:18<26:41:27, 5.49s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 338/17840 [33:18<26:41:27, 5.49s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:20,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:23,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:23,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2199, 'learning_rate': 3.3600000000000004e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:26,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 340/17840 [33:28<25:22:39, 5.22s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 340/17840 [33:28<25:22:39, 5.22s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:30,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:32,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:32,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:34,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:36,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:36,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:39,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:41,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:41,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:43,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:44,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:44,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:46,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:48,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:48,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:51,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:51,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:52,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:54,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:54,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:56,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:56,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:59,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:31:59,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:01,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:01,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5474, 'learning_rate': 3.4699999999999996e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:01,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:05,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:09,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:09,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2565, 'learning_rate': 3.48e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:13,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:13,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:16,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:16,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3299, 'learning_rate': 3.49e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:16,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:16,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [34:25<28:54:00, 5.95s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 353/17840 [34:25<28:54:00, 5.95s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2378, 'learning_rate': 3.5e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:29,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [34:32<30:49:27, 6.35s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [34:32<30:49:27, 6.35s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2547, 'learning_rate': 3.51e-05, 'epoch': 0.4} + 2%|█▌ | 354/17840 [34:32<30:49:27, 6.35s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 354/17840 [34:32<30:49:27, 6.35s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [34:39<32:10:04, 6.62s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 355/17840 [34:39<32:10:04, 6.62s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4107, 'learning_rate': 3.52e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:44,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [34:46<32:55:47, 6.78s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [34:46<32:55:47, 6.78s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1386, 'learning_rate': 3.53e-05, 'epoch': 0.4} + 2%|█▌ | 356/17840 [34:46<32:55:47, 6.78s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 356/17840 [34:46<32:55:47, 6.78s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [34:54<33:27:47, 6.89s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 357/17840 [34:54<33:27:47, 6.89s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1969, 'learning_rate': 3.54e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:58,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:32:58,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:01<33:52:05, 6.97s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:01<33:52:05, 6.97s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:01<33:52:05, 6.97s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:01<33:52:05, 6.97s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [35:01<33:52:05, 6.97s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [35:08<34:08:40, 7.03s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [35:08<34:08:40, 7.03s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:12,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:12,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [35:15<34:05:13, 7.02s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [35:15<34:05:13, 7.02s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [35:15<34:05:13, 7.02s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [35:15<34:05:13, 7.02s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [35:15<34:05:13, 7.02s/it]g-point operations will not be computed-18 09:31:08,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [35:22<33:58:47, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [35:22<33:58:47, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [35:22<33:58:47, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [35:22<33:58:47, 7.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [35:29<33:43:05, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [35:29<33:43:05, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [35:29<33:43:05, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [35:29<33:43:05, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:35,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:35,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:35,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:35,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:35,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [35:42<33:25:35, 6.89s/it]g-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:45,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:45,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:45,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [35:49<33:08:46, 6.83s/it]g-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [35:49<33:08:46, 6.83s/it]g-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:53,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:33:53,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [35:56<32:58:46, 6.79s/it]g-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [35:56<32:58:46, 6.79s/it]g-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [35:56<32:58:46, 6.79s/it]g-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [35:56<32:58:46, 6.79s/it]g-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [35:56<32:58:46, 6.79s/it]g-point operations will not be computed-18 09:33:23,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [36:02<32:50:22, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [36:02<32:50:22, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [36:02<32:50:22, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [36:02<32:50:22, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [36:09<32:39:13, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:12,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:12,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:12,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [36:16<32:29:40, 6.70s/it]g-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:18,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:18,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:18,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [36:22<32:23:46, 6.68s/it]g-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [36:22<32:23:46, 6.68s/it]g-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [36:22<32:23:46, 6.68s/it]g-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [36:22<32:23:46, 6.68s/it]g-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [36:22<32:23:46, 6.68s/it]g-point operations will not be computed-18 09:34:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [36:29<32:19:21, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:30,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [36:29<32:19:21, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:30,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [36:29<32:19:21, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:30,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [36:29<32:19:21, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:30,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 372/17840 [36:36<32:10:34, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 372/17840 [36:36<32:10:34, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 372/17840 [36:36<32:10:34, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 372/17840 [36:36<32:10:34, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 373/17840 [36:42<31:53:20, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 373/17840 [36:42<31:53:20, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:46,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:46,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 374/17840 [36:48<31:26:33, 6.48s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 374/17840 [36:48<31:26:33, 6.48s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:34:52,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [36:55<31:54:25, 6.58s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [36:55<31:54:25, 6.58s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1942, 'learning_rate': 3.72e-05, 'epoch': 0.42} + 2%|█▌ | 375/17840 [36:55<31:54:25, 6.58s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:01,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:01,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3037, 'learning_rate': 3.73e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:01,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:07,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:07,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0917, 'learning_rate': 3.74e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:07,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3677, 'learning_rate': 3.7500000000000003e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:13,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:19,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:19,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2856, 'learning_rate': 3.76e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:19,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:25,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:25,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4101, 'learning_rate': 3.77e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:30,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [37:32<29:51:28, 6.16s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 381/17840 [37:32<29:51:28, 6.16s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3754, 'learning_rate': 3.7800000000000004e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:36,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 382/17840 [37:38<29:29:29, 6.08s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 382/17840 [37:38<29:29:29, 6.08s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2856, 'learning_rate': 3.79e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:42,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 383/17840 [37:44<29:11:21, 6.02s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 383/17840 [37:44<29:11:21, 6.02s/it]g-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:46,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:46,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:46,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:34:36,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 384/17840 [37:50<28:36:02, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 384/17840 [37:50<28:36:02, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:54,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:54,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.206, 'learning_rate': 3.82e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-18 09:35:59,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 386/17840 [38:01<27:43:51, 5.72s/it]g-point operations will not be computed-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 386/17840 [38:01<27:43:51, 5.72s/it]g-point operations will not be computed-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:03,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:03,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:03,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:35:50,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 387/17840 [38:06<27:07:39, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:07,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 387/17840 [38:06<27:07:39, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:07,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:10,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:07,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:10,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:07,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:13,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:07,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:13,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:07,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 389/17840 [38:16<25:58:00, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:17,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 389/17840 [38:16<25:58:00, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:17,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:19,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:17,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 390/17840 [38:21<25:10:59, 5.20s/it]g-point operations will not be computed-18 09:36:17,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 390/17840 [38:21<25:10:59, 5.20s/it]g-point operations will not be computed-18 09:36:17,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:23,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:17,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:23,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:17,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:23,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:17,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 391/17840 [38:26<24:22:12, 5.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:26,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:28,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:26,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:28,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:26,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 392/17840 [38:30<23:32:07, 4.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:30,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:32,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:30,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:32,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:30,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 393/17840 [38:34<22:26:41, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:35,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:35,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:35,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 394/17840 [38:38<21:27:56, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:38,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 395/17840 [38:42<20:19:24, 4.19s/it]g-point operations will not be computed-18 09:36:38,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 395/17840 [38:42<20:19:24, 4.19s/it]g-point operations will not be computed-18 09:36:38,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 395/17840 [38:42<20:19:24, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:42,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 396/17840 [38:45<18:55:58, 3.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 396/17840 [38:45<18:55:58, 3.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 397/17840 [38:48<17:22:53, 3.59s/it]g-point operations will not be computed-18 09:36:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 397/17840 [38:48<17:22:53, 3.59s/it]g-point operations will not be computed-18 09:36:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:49,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:48,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:49,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:48,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:51,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:50,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:51,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:50,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:36:53,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:52,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [38:55<13:40:07, 2.82s/it]g-point operations will not be computed-18 09:36:52,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [38:55<13:40:07, 2.82s/it]g-point operations will not be computed-18 09:36:52,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [38:55<13:40:07, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:57,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 400/17840 [38:55<13:40:07, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:36:57,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:37:00,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:36:57,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [39:03<21:02:20, 4.34s/it]g-point operations will not be computed-18 09:36:57,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [39:03<21:02:20, 4.34s/it]g-point operations will not be computed-18 09:36:57,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [39:03<21:02:20, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:04,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 401/17840 [39:03<21:02:20, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:04,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:11<25:34:39, 5.28s/it]g-point operations will not be computed-18 09:37:04,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:11<25:34:39, 5.28s/it]g-point operations will not be computed-18 09:37:04,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:11<25:34:39, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:11<25:34:39, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 402/17840 [39:11<25:34:39, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [39:18<28:45:26, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [39:18<28:45:26, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3407, 'learning_rate': 4e-05, 'epoch': 0.45} + 2%|█▋ | 403/17840 [39:18<28:45:26, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 403/17840 [39:18<28:45:26, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [39:25<30:40:05, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 404/17840 [39:25<30:40:05, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:37:28,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:37:28,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [39:32<31:53:05, 6.58s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [39:32<31:53:05, 6.58s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4073, 'learning_rate': 4.02e-05, 'epoch': 0.45} + 2%|█▋ | 405/17840 [39:32<31:53:05, 6.58s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 405/17840 [39:32<31:53:05, 6.58s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [39:40<32:49:07, 6.78s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [39:40<32:49:07, 6.78s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2966, 'learning_rate': 4.0300000000000004e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-18 09:37:44,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [39:47<33:21:31, 6.89s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [39:47<33:21:31, 6.89s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3111, 'learning_rate': 4.0400000000000006e-05, 'epoch': 0.46} + 2%|█▋ | 407/17840 [39:47<33:21:31, 6.89s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [39:47<33:21:31, 6.89s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [39:54<33:48:28, 6.98s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [39:54<33:48:28, 6.98s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1803, 'learning_rate': 4.05e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-18 09:37:59,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:37:59,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [40:01<33:52:18, 7.00s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [40:01<33:52:18, 7.00s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [40:01<33:52:18, 7.00s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [40:01<33:52:18, 7.00s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 409/17840 [40:01<33:52:18, 7.00s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [40:08<34:00:40, 7.02s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [40:08<34:00:40, 7.02s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:38:13,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:38:13,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [40:15<33:56:35, 7.01s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [40:15<33:56:35, 7.01s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [40:15<33:56:35, 7.01s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [40:15<33:56:35, 7.01s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [40:15<33:56:35, 7.01s/it]g-point operations will not be computed-18 09:37:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [40:22<33:50:47, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [40:22<33:50:47, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [40:22<33:50:47, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [40:22<33:50:47, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [40:29<33:33:09, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:38:32,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:38:32,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:38:32,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [40:36<33:26:52, 6.91s/it]g-point operations will not be computed-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [40:36<33:26:52, 6.91s/it]g-point operations will not be computed-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [40:36<33:26:52, 6.91s/it]g-point operations will not be computed-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [40:36<33:26:52, 6.91s/it]g-point operations will not be computed-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [40:36<33:26:52, 6.91s/it]g-point operations will not be computed-18 09:38:23,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [40:43<33:20:44, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [40:43<33:20:44, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [40:43<33:20:44, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [40:43<33:20:44, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 416/17840 [40:49<33:08:31, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 416/17840 [40:49<33:08:31, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:38:54,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:38:54,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [40:56<32:51:19, 6.79s/it]g-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [40:56<32:51:19, 6.79s/it]g-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [40:56<32:51:19, 6.79s/it]g-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:02,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:02,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3631, 'learning_rate': 4.15e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:02,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:02,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:02,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:38:44,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [41:09<32:37:52, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [41:09<32:37:52, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [41:09<32:37:52, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [41:09<32:37:52, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 420/17840 [41:16<32:17:12, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:18,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:18,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:18,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 421/17840 [41:22<32:11:12, 6.65s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 421/17840 [41:22<32:11:12, 6.65s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:27,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 422/17840 [41:29<32:00:49, 6.62s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 422/17840 [41:29<32:00:49, 6.62s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3556, 'learning_rate': 4.19e-05, 'epoch': 0.47} + 2%|█▊ | 422/17840 [41:29<32:00:49, 6.62s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:35,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:35,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3351, 'learning_rate': 4.2e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:35,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:41,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:41,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3065, 'learning_rate': 4.21e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:41,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:41,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 425/17840 [41:49<32:06:56, 6.64s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 425/17840 [41:49<32:06:56, 6.64s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:51,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:51,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:51,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 426/17840 [41:55<31:44:50, 6.56s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:58,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:58,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:39:58,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [42:01<31:17:07, 6.47s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 427/17840 [42:01<31:17:07, 6.47s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:05,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:05,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 428/17840 [42:08<30:54:18, 6.39s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 428/17840 [42:08<30:54:18, 6.39s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:11,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 429/17840 [42:14<30:26:22, 6.29s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 429/17840 [42:14<30:26:22, 6.29s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2802, 'learning_rate': 4.26e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:17,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 430/17840 [42:20<30:05:02, 6.22s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 430/17840 [42:20<30:05:02, 6.22s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3824, 'learning_rate': 4.27e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:24,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:24,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [42:26<29:49:54, 6.17s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:28,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:28,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:28,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 432/17840 [42:32<29:25:24, 6.08s/it]g-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:34,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:34,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:34,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:39:10,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [42:38<29:12:03, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:38,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [42:38<29:12:03, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:38,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [42:38<29:12:03, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:38,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [42:38<29:12:03, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:38,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [42:43<28:59:12, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:44,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [42:43<28:59:12, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:44,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [42:43<28:59:12, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:44,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 434/17840 [42:43<28:59:12, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:44,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 435/17840 [42:49<28:31:25, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 435/17840 [42:49<28:31:25, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:54,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:54,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4746, 'learning_rate': 4.33e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:58,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:40:58,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 437/17840 [43:00<27:45:10, 5.74s/it]g-point operations will not be computed-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:02,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:02,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:02,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:40:50,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 438/17840 [43:06<27:07:49, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:41:06,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:09,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:06,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 439/17840 [43:11<26:33:54, 5.50s/it]g-point operations will not be computed-18 09:41:06,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 439/17840 [43:11<26:33:54, 5.50s/it]g-point operations will not be computed-18 09:41:06,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:13,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:06,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:15,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:06,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:15,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:06,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2574, 'learning_rate': 4.3700000000000005e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:19,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:06,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [43:21<24:56:33, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [43:21<24:56:33, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:23,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 442/17840 [43:25<23:57:38, 4.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 442/17840 [43:25<23:57:38, 4.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:26,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:28,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:28,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:31,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:32,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:32,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:34,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:36,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:36,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:39,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:39,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:41,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:44,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:44,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:45,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:45,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:47,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:47,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:49,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:49,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9296, 'learning_rate': 4.47e-05, 'epoch': 0.5} +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:53,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:53,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:57,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:41:57,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3197, 'learning_rate': 4.4800000000000005e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:01,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:01,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:05,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:05,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3162, 'learning_rate': 4.49e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:05,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:12,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:12,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:12,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4748, 'learning_rate': 4.5e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:12,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [44:20<30:10:56, 6.25s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [44:20<30:10:56, 6.25s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.107, 'learning_rate': 4.5100000000000005e-05, 'epoch': 0.51} + 3%|█▉ | 454/17840 [44:20<30:10:56, 6.25s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 454/17840 [44:20<30:10:56, 6.25s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:26,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:26,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:26,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:26,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:26,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [44:34<32:14:12, 6.68s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [44:34<32:14:12, 6.68s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [44:34<32:14:12, 6.68s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [44:34<32:14:12, 6.68s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:40,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:40,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:40,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:40,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:40,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 458/17840 [44:48<33:23:12, 6.91s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 458/17840 [44:48<33:23:12, 6.91s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:42:53,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [44:55<33:37:10, 6.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [44:55<33:37:10, 6.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.386, 'learning_rate': 4.5600000000000004e-05, 'epoch': 0.51} + 3%|█▉ | 459/17840 [44:55<33:37:10, 6.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [44:55<33:37:10, 6.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [44:55<33:37:10, 6.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 460/17840 [45:02<33:36:23, 6.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 460/17840 [45:02<33:36:23, 6.96s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:07,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:07,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [45:09<33:34:00, 6.95s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [45:09<33:34:00, 6.95s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [45:09<33:34:00, 6.95s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:15,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:15,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2382, 'learning_rate': 4.5900000000000004e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:15,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:15,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:15,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [45:23<33:25:19, 6.92s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [45:23<33:25:19, 6.92s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:27,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [45:30<33:11:56, 6.88s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [45:30<33:11:56, 6.88s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1281, 'learning_rate': 4.61e-05, 'epoch': 0.52} + 3%|█▉ | 464/17840 [45:30<33:11:56, 6.88s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:36,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:36,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3115, 'learning_rate': 4.6200000000000005e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:36,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:36,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:36,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [45:43<32:51:23, 6.81s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:46,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:46,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:46,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [45:50<32:42:55, 6.78s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [45:50<32:42:55, 6.78s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:43:54,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [45:57<32:27:31, 6.73s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [45:57<32:27:31, 6.73s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1019, 'learning_rate': 4.6500000000000005e-05, 'epoch': 0.52} + 3%|█▉ | 468/17840 [45:57<32:27:31, 6.73s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [45:57<32:27:31, 6.73s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [45:57<32:27:31, 6.73s/it]g-point operations will not be computed-18 09:41:21,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [46:03<32:21:40, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [46:03<32:21:40, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [46:03<32:21:40, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [46:03<32:21:40, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [46:10<32:07:31, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:12,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:12,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:12,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [46:16<31:50:58, 6.60s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [46:16<31:50:58, 6.60s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:20,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [46:23<31:37:58, 6.56s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [46:23<31:37:58, 6.56s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1289, 'learning_rate': 4.69e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:27,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [46:29<31:22:56, 6.51s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [46:29<31:22:56, 6.51s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.343, 'learning_rate': 4.7e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:33,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [46:35<31:06:15, 6.45s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [46:35<31:06:15, 6.45s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3209, 'learning_rate': 4.71e-05, 'epoch': 0.53} + 3%|██ | 474/17840 [46:35<31:06:15, 6.45s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [46:35<31:06:15, 6.45s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [46:35<31:06:15, 6.45s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [46:42<31:39:08, 6.56s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:45,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:45,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:45,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 476/17840 [46:49<31:15:04, 6.48s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:51,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:51,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:51,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [46:55<30:52:37, 6.40s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:57,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:57,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:44:57,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [47:01<30:30:51, 6.33s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:03,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:03,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:03,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 479/17840 [47:07<30:10:12, 6.26s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:09,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:09,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:09,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 480/17840 [47:13<29:54:14, 6.20s/it]g-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:15,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:15,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:15,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:44:04,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [47:19<29:32:54, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:45:20,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [47:19<29:32:54, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:45:20,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:20,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:20,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1576, 'learning_rate': 4.79e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:20,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:20,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:24,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:20,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 483/17840 [47:31<28:48:52, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:34,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 484/17840 [47:36<28:23:16, 5.89s/it]g-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 484/17840 [47:36<28:23:16, 5.89s/it]g-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:38,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:38,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 485/17840 [47:42<27:51:37, 5.78s/it]g-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 485/17840 [47:42<27:51:37, 5.78s/it]g-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:44,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:44,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:44,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:31,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 486/17840 [47:47<27:27:58, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:45:48,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 486/17840 [47:47<27:27:58, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:45:48,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:52,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:48,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:52,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:48,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:55,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:48,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:55,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:48,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:45:55,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:48,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 488/17840 [47:58<26:29:43, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:45:59,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 488/17840 [47:58<26:29:43, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:45:59,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:02,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:59,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:02,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:59,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2781, 'learning_rate': 4.86e-05, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:06,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:59,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:06,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:45:59,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 490/17840 [48:08<25:01:35, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:08,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:11,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:08,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 491/17840 [48:12<24:02:31, 4.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:13,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 491/17840 [48:12<24:02:31, 4.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:13,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:15,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:13,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 492/17840 [48:17<23:00:01, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:17,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 492/17840 [48:17<23:00:01, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:17,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:19,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:17,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 493/17840 [48:21<21:43:21, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:21,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 493/17840 [48:21<21:43:21, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:21,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:23,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:21,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:23,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:21,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 494/17840 [48:24<20:17:16, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:24,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 495/17840 [48:27<18:51:44, 3.91s/it]g-point operations will not be computed-18 09:46:24,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 495/17840 [48:27<18:51:44, 3.91s/it]g-point operations will not be computed-18 09:46:24,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:29,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:27,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:29,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:27,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 496/17840 [48:30<17:27:47, 3.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:30,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 497/17840 [48:33<16:07:53, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:33,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 497/17840 [48:33<16:07:53, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:33,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 498/17840 [48:35<14:43:20, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:35,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 498/17840 [48:35<14:43:20, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:35,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 499/17840 [48:38<13:27:02, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:37,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 499/17840 [48:38<13:27:02, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:37,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [48:40<12:57:05, 2.69s/it]g-point operations will not be computed-18 09:46:37,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [48:40<12:57:05, 2.69s/it]g-point operations will not be computed-18 09:46:37,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [48:40<12:57:05, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:41,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 500/17840 [48:40<12:57:05, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:41,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:45,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:41,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [48:48<20:10:09, 4.19s/it]g-point operations will not be computed-18 09:46:41,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [48:48<20:10:09, 4.19s/it]g-point operations will not be computed-18 09:46:41,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [48:48<20:10:09, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:49,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 501/17840 [48:48<20:10:09, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:49,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:46:53,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:49,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [48:55<24:55:29, 5.18s/it]g-point operations will not be computed-18 09:46:49,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [48:55<24:55:29, 5.18s/it]g-point operations will not be computed-18 09:46:49,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [48:55<24:55:29, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 502/17840 [48:55<24:55:29, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:02,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:02,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4261, 'learning_rate': 5e-05, 'epoch': 0.56} +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:02,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:02,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [49:10<29:59:42, 6.23s/it]g-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [49:10<29:59:42, 6.23s/it]g-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3206, 'learning_rate': 5.0100000000000005e-05, 'epoch': 0.57} + 3%|██▏ | 504/17840 [49:10<29:59:42, 6.23s/it]g-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [49:10<29:59:42, 6.23s/it]g-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 504/17840 [49:10<29:59:42, 6.23s/it]g-point operations will not be computed-18 09:46:56,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [49:17<31:20:48, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [49:17<31:20:48, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [49:17<31:20:48, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 505/17840 [49:17<31:20:48, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [49:24<32:09:26, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [49:24<32:09:26, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [49:24<32:09:26, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [49:24<32:09:26, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:30,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:30,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:30,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:30,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:30,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 508/17840 [49:38<33:05:32, 6.87s/it]g-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 508/17840 [49:38<33:05:32, 6.87s/it]g-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:43,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:43,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [49:45<33:22:01, 6.93s/it]g-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [49:45<33:22:01, 6.93s/it]g-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [49:45<33:22:01, 6.93s/it]g-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [49:45<33:22:01, 6.93s/it]g-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [49:45<33:22:01, 6.93s/it]g-point operations will not be computed-18 09:47:18,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 510/17840 [49:52<33:28:05, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:56,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:47:56,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [49:59<33:19:59, 6.92s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [49:59<33:19:59, 6.92s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [49:59<33:19:59, 6.92s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:05,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:05,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2494, 'learning_rate': 5.0900000000000004e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:05,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:05,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:05,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [50:13<33:07:08, 6.88s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [50:13<33:07:08, 6.88s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:17,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [50:19<33:05:05, 6.87s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [50:19<33:05:05, 6.87s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2406, 'learning_rate': 5.11e-05, 'epoch': 0.58} + 3%|██▏ | 514/17840 [50:19<33:05:05, 6.87s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:25,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:25,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3145, 'learning_rate': 5.1200000000000004e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:25,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:25,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:25,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [50:33<32:45:06, 6.81s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:36,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:36,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:36,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 517/17840 [50:40<32:31:22, 6.76s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 517/17840 [50:40<32:31:22, 6.76s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:48:44,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [50:46<32:20:48, 6.72s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [50:46<32:20:48, 6.72s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2704, 'learning_rate': 5.1500000000000005e-05, 'epoch': 0.58} + 3%|██▏ | 518/17840 [50:46<32:20:48, 6.72s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [50:46<32:20:48, 6.72s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [50:46<32:20:48, 6.72s/it]g-point operations will not be computed-18 09:47:53,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [50:53<32:13:12, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [50:53<32:13:12, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [50:53<32:13:12, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [50:53<32:13:12, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [50:59<31:58:28, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:02,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:02,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:02,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [51:06<31:53:28, 6.63s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [51:06<31:53:28, 6.63s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:10,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [51:12<31:39:46, 6.58s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [51:12<31:39:46, 6.58s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2017, 'learning_rate': 5.19e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:17,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [51:19<31:26:52, 6.54s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [51:19<31:26:52, 6.54s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2755, 'learning_rate': 5.2000000000000004e-05, 'epoch': 0.59} + 3%|██▏ | 523/17840 [51:19<31:26:52, 6.54s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [51:19<31:26:52, 6.54s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [51:19<31:26:52, 6.54s/it]g-point operations will not be computed-18 09:48:54,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [51:25<31:12:57, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [51:25<31:12:57, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [51:25<31:12:57, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 524/17840 [51:25<31:12:57, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [51:32<31:47:04, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [51:32<31:47:04, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:36,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:36,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 526/17840 [51:38<31:20:41, 6.52s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 526/17840 [51:38<31:20:41, 6.52s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:42,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [51:45<31:02:38, 6.46s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [51:45<31:02:38, 6.46s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2972, 'learning_rate': 5.2400000000000007e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:49,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:49,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 528/17840 [51:51<30:39:24, 6.38s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 528/17840 [51:51<30:39:24, 6.38s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:55,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:49:55,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 529/17840 [51:57<30:18:23, 6.30s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 529/17840 [51:57<30:18:23, 6.30s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:01,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:01,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 530/17840 [52:03<29:57:03, 6.23s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 530/17840 [52:03<29:57:03, 6.23s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:07,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:07,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 531/17840 [52:09<29:34:35, 6.15s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 531/17840 [52:09<29:34:35, 6.15s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:13,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:13,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 532/17840 [52:15<29:14:28, 6.08s/it]g-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:17,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:17,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:17,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:49:26,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 533/17840 [52:21<28:43:19, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 533/17840 [52:21<28:43:19, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:26,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:26,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1809, 'learning_rate': 5.31e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:26,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:31,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:31,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3227, 'learning_rate': 5.3200000000000006e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:36,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:36,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 536/17840 [52:38<27:38:49, 5.75s/it]g-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:40,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:40,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:40,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:21,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 537/17840 [52:43<27:15:31, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:50:44,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 537/17840 [52:43<27:15:31, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:50:44,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:48,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:44,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:48,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:44,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4979, 'learning_rate': 5.3500000000000006e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:51,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:44,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:51,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:44,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 539/17840 [52:53<25:50:37, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 539/17840 [52:53<25:50:37, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:57,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:50:57,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:00,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:02,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:02,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:04,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:06,299 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:06,299 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:08,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:10,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:10,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:11,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:13,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:13,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:16,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:16,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:18,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:18,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:19,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:22,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:22,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:24,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:24,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:26,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:26,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:27,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:27,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:29,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:29,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:33,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:36,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:36,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1631, 'learning_rate': 5.4800000000000004e-05, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:40,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:40,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:44,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:44,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.478, 'learning_rate': 5.4900000000000006e-05, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:48,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:48,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:48,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 553/17840 [53:52<27:56:45, 5.82s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 553/17840 [53:52<27:56:45, 5.82s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:51:57,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [53:59<29:47:59, 6.21s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [53:59<29:47:59, 6.21s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2782, 'learning_rate': 5.5100000000000004e-05, 'epoch': 0.62} + 3%|██▎ | 554/17840 [53:59<29:47:59, 6.21s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [53:59<29:47:59, 6.21s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 554/17840 [53:59<29:47:59, 6.21s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 555/17840 [54:06<31:07:55, 6.48s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:52:09,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:52:09,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [54:13<32:07:29, 6.69s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [54:13<32:07:29, 6.69s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3003, 'learning_rate': 5.530000000000001e-05, 'epoch': 0.62} + 3%|██▎ | 556/17840 [54:13<32:07:29, 6.69s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [54:13<32:07:29, 6.69s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [54:13<32:07:29, 6.69s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [54:20<32:35:48, 6.79s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [54:20<32:35:48, 6.79s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:52:25,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [54:28<33:01:27, 6.88s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [54:28<33:01:27, 6.88s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2154, 'learning_rate': 5.550000000000001e-05, 'epoch': 0.63} + 3%|██▍ | 558/17840 [54:28<33:01:27, 6.88s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [54:28<33:01:27, 6.88s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [54:28<33:01:27, 6.88s/it]g-point operations will not be computed-18 09:50:54,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [54:34<33:07:36, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [54:34<33:07:36, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [54:34<33:07:36, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 560/17840 [54:41<33:09:37, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 560/17840 [54:41<33:09:37, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1834, 'learning_rate': 5.5700000000000005e-05, 'epoch': 0.63} + 3%|██▍ | 560/17840 [54:41<33:09:37, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:52:47,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:52:47,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4362, 'learning_rate': 5.580000000000001e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-18 09:52:47,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:52:47,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:52:47,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:35,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 562/17840 [54:55<33:01:14, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 562/17840 [54:55<33:01:14, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 562/17840 [54:55<33:01:14, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [55:02<32:45:23, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [55:02<32:45:23, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:04,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:04,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [55:09<32:37:53, 6.80s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [55:09<32:37:53, 6.80s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2289, 'learning_rate': 5.610000000000001e-05, 'epoch': 0.63} + 3%|██▍ | 564/17840 [55:09<32:37:53, 6.80s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:14,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:14,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3864, 'learning_rate': 5.620000000000001e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:14,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:14,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [55:22<32:24:10, 6.75s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [55:22<32:24:10, 6.75s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:25,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:25,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [55:29<32:14:28, 6.72s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [55:29<32:14:28, 6.72s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.266, 'learning_rate': 5.6399999999999995e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:33,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [55:35<32:03:19, 6.68s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [55:35<32:03:19, 6.68s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2271, 'learning_rate': 5.65e-05, 'epoch': 0.64} + 3%|██▍ | 568/17840 [55:35<32:03:19, 6.68s/it]g-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:41,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:41,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3536, 'learning_rate': 5.66e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:41,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:47,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:47,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2307, 'learning_rate': 5.6699999999999996e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:47,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:47,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:53:47,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:52:56,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 571/17840 [55:55<31:26:45, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 571/17840 [55:55<31:26:45, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 571/17840 [55:55<31:26:45, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 571/17840 [55:55<31:26:45, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 572/17840 [56:01<31:11:41, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:03,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:03,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:03,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 573/17840 [56:07<30:56:11, 6.45s/it]g-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 573/17840 [56:07<30:56:11, 6.45s/it]g-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:11,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:11,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 574/17840 [56:14<30:41:35, 6.40s/it]g-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 574/17840 [56:14<30:41:35, 6.40s/it]g-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:18,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:18,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [56:21<31:19:11, 6.53s/it]g-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [56:21<31:19:11, 6.53s/it]g-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [56:21<31:19:11, 6.53s/it]g-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:26,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:26,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2469, 'learning_rate': 5.73e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:26,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:32,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:32,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3052, 'learning_rate': 5.74e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:32,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:38,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:38,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4057, 'learning_rate': 5.7499999999999995e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:38,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:44,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:44,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9485, 'learning_rate': 5.76e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:44,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:44,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:54:44,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:53:56,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [56:51<29:43:48, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:54:52,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [56:51<29:43:48, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:54:52,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [56:51<29:43:48, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:54:52,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [56:51<29:43:48, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:54:52,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [56:57<29:25:45, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [56:57<29:25:45, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:02,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:02,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2476, 'learning_rate': 5.79e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:07,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:07,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 583/17840 [57:09<28:48:54, 6.01s/it]g-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:11,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:11,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:11,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 584/17840 [57:15<28:18:20, 5.91s/it]g-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:17,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:20,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:20,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4622, 'learning_rate': 5.82e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:20,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:25,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:25,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3631, 'learning_rate': 5.83e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:25,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:25,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:31,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:54:58,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 588/17840 [57:37<26:29:31, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:55:37,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 588/17840 [57:37<26:29:31, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:55:37,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:41,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:37,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:41,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:37,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:44,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:37,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:44,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:37,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:44,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:37,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 590/17840 [57:47<25:20:22, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:50,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:50,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 591/17840 [57:51<24:33:49, 5.13s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:53,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:55,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:55,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:55:58,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:00,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:00,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:02,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:03,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:03,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:05,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:05,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:07,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:10,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:10,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:12,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:12,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:13,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:15,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:15,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:18,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:18,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:19,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:19,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:20,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:24,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:24,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:28,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:28,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3338, 'learning_rate': 5.9800000000000003e-05, 'epoch': 0.67} +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:35,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:35,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:35,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:42,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:42,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3321, 'learning_rate': 6e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:42,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:42,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [58:50<29:46:15, 6.22s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [58:50<29:46:15, 6.22s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4139, 'learning_rate': 6.0100000000000004e-05, 'epoch': 0.68} + 3%|██▌ | 604/17840 [58:50<29:46:15, 6.22s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:57,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:57,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2934, 'learning_rate': 6.02e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:57,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:57,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:56:57,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [59:04<31:53:03, 6.66s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [59:04<31:53:03, 6.66s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [59:04<31:53:03, 6.66s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:11,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:11,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.408, 'learning_rate': 6.04e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:11,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:11,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [59:18<32:44:10, 6.84s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [59:18<32:44:10, 6.84s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:21,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:21,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [59:25<32:54:34, 6.88s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [59:25<32:54:34, 6.88s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2808, 'learning_rate': 6.06e-05, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:30,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 610/17840 [59:32<32:52:40, 6.87s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 610/17840 [59:32<32:52:40, 6.87s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3081, 'learning_rate': 6.07e-05, 'epoch': 0.68} + 3%|██▌ | 610/17840 [59:32<32:52:40, 6.87s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 610/17840 [59:32<32:52:40, 6.87s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [59:39<32:52:17, 6.87s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [59:39<32:52:17, 6.87s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:42,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:42,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [59:46<32:44:38, 6.84s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 612/17840 [59:46<32:44:38, 6.84s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4525, 'learning_rate': 6.09e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:50,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:57:50,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [59:53<32:31:04, 6.80s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [59:53<32:31:04, 6.80s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [59:53<32:31:04, 6.80s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [59:53<32:31:04, 6.80s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [59:53<32:31:04, 6.80s/it]g-point operations will not be computed-18 09:55:47,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [59:59<32:15:59, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [59:59<32:15:59, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [59:59<32:15:59, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [59:59<32:15:59, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 615/17840 [1:00:06<32:06:53, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:08,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:08,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:08,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 616/17840 [1:00:12<31:56:01, 6.67s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 616/17840 [1:00:12<31:56:01, 6.67s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:17,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:17,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 617/17840 [1:00:19<31:45:37, 6.64s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 617/17840 [1:00:19<31:45:37, 6.64s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 617/17840 [1:00:19<31:45:37, 6.64s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:25,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:25,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1818, 'learning_rate': 6.15e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:25,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:31,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:31,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3438, 'learning_rate': 6.16e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:31,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:31,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:31,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 620/17840 [1:00:39<31:23:16, 6.56s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:41,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:41,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:41,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 621/17840 [1:00:45<31:17:24, 6.54s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 621/17840 [1:00:45<31:17:24, 6.54s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:49,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:49,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 622/17840 [1:00:52<31:13:31, 6.53s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 622/17840 [1:00:52<31:13:31, 6.53s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:58:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 623/17840 [1:00:58<31:10:05, 6.52s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 623/17840 [1:00:58<31:10:05, 6.52s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 623/17840 [1:00:58<31:10:05, 6.52s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:04,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:04,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2597, 'learning_rate': 6.21e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:04,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:04,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:04,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 625/17840 [1:01:11<31:37:11, 6.61s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 625/17840 [1:01:11<31:37:11, 6.61s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:15,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:15,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 626/17840 [1:01:18<31:14:06, 6.53s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 626/17840 [1:01:18<31:14:06, 6.53s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:22,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:22,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:01:24<30:46:00, 6.43s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 627/17840 [1:01:24<30:46:00, 6.43s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:28,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:28,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 628/17840 [1:01:30<30:21:50, 6.35s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:32,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:32,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:32,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 629/17840 [1:01:36<30:02:02, 6.28s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:39,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:39,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:39,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 630/17840 [1:01:42<29:50:40, 6.24s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:45,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:45,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:45,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 631/17840 [1:01:48<29:30:26, 6.17s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:51,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:51,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:51,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▌ | 632/17840 [1:01:54<29:09:27, 6.10s/it]g-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:57,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:57,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 09:59:57,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 09:58:00,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:02:00<28:52:00, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:01,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:02:00<28:52:00, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:01,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:02:00<28:52:00, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:01,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 633/17840 [1:02:00<28:52:00, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:01,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 634/17840 [1:02:06<28:30:02, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:09,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 635/17840 [1:02:12<28:03:16, 5.87s/it]g-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 635/17840 [1:02:12<28:03:16, 5.87s/it]g-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5151, 'learning_rate': 6.32e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:15,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 636/17840 [1:02:17<27:39:00, 5.79s/it]g-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 636/17840 [1:02:17<27:39:00, 5.79s/it]g-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:19,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:22,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:22,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3032, 'learning_rate': 6.340000000000001e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:26,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 638/17840 [1:02:28<26:45:53, 5.60s/it]g-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 638/17840 [1:02:28<26:45:53, 5.60s/it]g-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:30,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:30,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:07,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 639/17840 [1:02:33<26:12:43, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:34,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 639/17840 [1:02:33<26:12:43, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:34,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3386, 'learning_rate': 6.36e-05, 'epoch': 0.72} +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:38,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:34,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:38,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:34,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:40,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:34,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:42,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:34,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:42,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:34,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2517, 'learning_rate': 6.38e-05, 'epoch': 0.72} +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:46,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:34,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 642/17840 [1:02:48<23:54:07, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:48,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 642/17840 [1:02:48<23:54:07, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:48,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:50,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:48,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 643/17840 [1:02:52<22:37:28, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:52,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 643/17840 [1:02:52<22:37:28, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:52,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:00:54,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:00:52,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 644/17840 [1:02:56<21:23:34, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:56,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 644/17840 [1:02:56<21:23:34, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:56,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 645/17840 [1:02:59<20:05:15, 4.21s/it]g-point operations will not be computed-18 10:00:56,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 645/17840 [1:02:59<20:05:15, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:59,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 645/17840 [1:02:59<20:05:15, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:00:59,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 646/17840 [1:03:03<18:44:43, 3.92s/it]g-point operations will not be computed-18 10:00:59,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 646/17840 [1:03:03<18:44:43, 3.92s/it]g-point operations will not be computed-18 10:00:59,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:04,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:03,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 647/17840 [1:03:06<17:19:56, 3.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:05,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 647/17840 [1:03:06<17:19:56, 3.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:05,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 648/17840 [1:03:08<15:53:27, 3.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:08,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 648/17840 [1:03:08<15:53:27, 3.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:08,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 649/17840 [1:03:10<14:21:43, 3.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:10,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 649/17840 [1:03:10<14:21:43, 3.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:10,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 650/17840 [1:03:13<13:36:16, 2.85s/it]g-point operations will not be computed-18 10:01:10,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 650/17840 [1:03:13<13:36:16, 2.85s/it]g-point operations will not be computed-18 10:01:10,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 650/17840 [1:03:13<13:36:16, 2.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:14,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 650/17840 [1:03:13<13:36:16, 2.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:14,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:18,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:14,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:18,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:14,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 651/17840 [1:03:21<20:47:45, 4.36s/it]g-point operations will not be computed-18 10:01:14,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 651/17840 [1:03:21<20:47:45, 4.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 651/17840 [1:03:21<20:47:45, 4.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:26,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:26,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 652/17840 [1:03:28<25:06:51, 5.26s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 652/17840 [1:03:28<25:06:51, 5.26s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:33,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:33,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:35<27:59:00, 5.86s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:35<27:59:00, 5.86s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:35<27:59:00, 5.86s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:35<27:59:00, 5.86s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 653/17840 [1:03:35<27:59:00, 5.86s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:03:43<29:53:45, 6.26s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:03:43<29:53:45, 6.26s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 654/17840 [1:03:43<29:53:45, 6.26s/it]g-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:49,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:49,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3676, 'learning_rate': 6.52e-05, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:49,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:49,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:01:49,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:01:22,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:03:57<31:53:38, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:03:57<31:53:38, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:03:57<31:53:38, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 656/17840 [1:03:57<31:53:38, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:04<32:20:47, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:04<32:20:47, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:04<32:20:47, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:04<32:20:47, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 657/17840 [1:04:04<32:20:47, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:01:58,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:04:11<32:37:51, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:04:11<32:37:51, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:04:11<32:37:51, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 658/17840 [1:04:11<32:37:51, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:04:18<32:47:09, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 659/17840 [1:04:18<32:47:09, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:22,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:04:25<32:50:09, 6.88s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:04:25<32:50:09, 6.88s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6014, 'learning_rate': 6.570000000000001e-05, 'epoch': 0.74} + 4%|██▋ | 660/17840 [1:04:25<32:50:09, 6.88s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:04:25<32:50:09, 6.88s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 660/17840 [1:04:25<32:50:09, 6.88s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 661/17840 [1:04:32<32:51:48, 6.89s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:34,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:34,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:34,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:04:38<32:56:26, 6.90s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:04:38<32:56:26, 6.90s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 662/17840 [1:04:38<32:56:26, 6.90s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:44,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:44,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5777, 'learning_rate': 6.6e-05, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:44,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:44,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:44,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 664/17840 [1:04:52<32:21:42, 6.78s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:54,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:54,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:02:54,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 665/17840 [1:04:59<32:17:47, 6.77s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 665/17840 [1:04:59<32:17:47, 6.77s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:03,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:05:05<32:06:51, 6.73s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 666/17840 [1:05:05<32:06:51, 6.73s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5372, 'learning_rate': 6.630000000000001e-05, 'epoch': 0.75} + 4%|██▊ | 666/17840 [1:05:05<32:06:51, 6.73s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:11,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:11,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2061, 'learning_rate': 6.64e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:11,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:18,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:18,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4104, 'learning_rate': 6.65e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:18,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:18,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:18,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 669/17840 [1:05:25<31:35:52, 6.62s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:27,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:27,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [1:05:31<31:29:48, 6.60s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [1:05:31<31:29:48, 6.60s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:34,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:34,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [1:05:38<31:13:34, 6.55s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [1:05:38<31:13:34, 6.55s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1917, 'learning_rate': 6.680000000000001e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:42,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 672/17840 [1:05:44<31:01:51, 6.51s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 672/17840 [1:05:44<31:01:51, 6.51s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3141, 'learning_rate': 6.690000000000001e-05, 'epoch': 0.75} + 4%|██▊ | 672/17840 [1:05:44<31:01:51, 6.51s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:50,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:50,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1279, 'learning_rate': 6.7e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:50,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:56,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:56,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1696, 'learning_rate': 6.71e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:56,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:03:56,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:06:04<31:14:46, 6.55s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:06:04<31:14:46, 6.55s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:06,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:06,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 676/17840 [1:06:10<30:58:31, 6.50s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 676/17840 [1:06:10<30:58:31, 6.50s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:13,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:13,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 677/17840 [1:06:16<30:35:42, 6.42s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 677/17840 [1:06:16<30:35:42, 6.42s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:19,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:19,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:06:23<30:10:34, 6.33s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:06:23<30:10:34, 6.33s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0379, 'learning_rate': 6.750000000000001e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:26,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:06:29<30:01:29, 6.30s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:06:29<30:01:29, 6.30s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2339, 'learning_rate': 6.76e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:33,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:06:35<29:44:21, 6.24s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 680/17840 [1:06:35<29:44:21, 6.24s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5472, 'learning_rate': 6.77e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:39,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:06:41<29:31:34, 6.19s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:06:41<29:31:34, 6.19s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5944, 'learning_rate': 6.780000000000001e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:45,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:06:47<29:07:53, 6.11s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:06:47<29:07:53, 6.11s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:49,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:49,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:49,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 683/17840 [1:06:53<28:49:35, 6.05s/it]g-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:55,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:55,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:04:55,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:02:12,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 684/17840 [1:06:59<28:24:13, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:02,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 685/17840 [1:07:04<28:02:02, 5.88s/it]g-point operations will not be computed-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 685/17840 [1:07:04<28:02:02, 5.88s/it]g-point operations will not be computed-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5406, 'learning_rate': 6.82e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:08,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 686/17840 [1:07:10<27:35:52, 5.79s/it]g-point operations will not be computed-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 686/17840 [1:07:10<27:35:52, 5.79s/it]g-point operations will not be computed-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:12,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:12,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:04:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:07:15<27:05:47, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 687/17840 [1:07:15<27:05:47, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3253, 'learning_rate': 6.840000000000001e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:20,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:20,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4927, 'learning_rate': 6.850000000000001e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:24,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 689/17840 [1:07:26<26:09:24, 5.49s/it]g-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 689/17840 [1:07:26<26:09:24, 5.49s/it]g-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:28,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:30,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:30,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6683, 'learning_rate': 6.87e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:34,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:16,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 691/17840 [1:07:36<24:57:00, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 691/17840 [1:07:36<24:57:00, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3221, 'learning_rate': 6.879999999999999e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:40,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:40,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:42,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:44,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:44,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:46,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:48,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:48,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:50,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:50,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:53,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:53,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:54,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:56,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:56,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:59,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:05:59,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:01,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:01,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:03,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:03,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:04,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:04,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:08,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:08,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:08,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:12,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:12,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:16,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:16,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:16,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:20,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:20,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:25,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:25,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:28<27:43:47, 5.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:28<27:43:47, 5.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:28<27:43:47, 5.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:28<27:43:47, 5.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:08:28<27:43:47, 5.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:08:35<29:41:49, 6.24s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:08:35<29:41:49, 6.24s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:08:35<29:41:49, 6.24s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:08:35<29:41:49, 6.24s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:41,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:41,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:41,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:41,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:41,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:08:49<31:51:19, 6.69s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:08:49<31:51:19, 6.69s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:06:54,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:08:56<32:31:28, 6.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:08:56<32:31:28, 6.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.421, 'learning_rate': 7.04e-05, 'epoch': 0.79} + 4%|██▉ | 707/17840 [1:08:56<32:31:28, 6.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:08:56<32:31:28, 6.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:08:56<32:31:28, 6.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:09:03<32:52:34, 6.91s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 708/17840 [1:09:03<32:52:34, 6.91s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:08,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:08,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:09:10<33:08:21, 6.96s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:09:10<33:08:21, 6.96s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:09:10<33:08:21, 6.96s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:09:10<33:08:21, 6.96s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 709/17840 [1:09:10<33:08:21, 6.96s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 710/17840 [1:09:17<33:11:31, 6.98s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:20,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:20,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:20,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:09:24<33:01:34, 6.94s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:09:24<33:01:34, 6.94s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:09:24<33:01:34, 6.94s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:30,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:30,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.263, 'learning_rate': 7.09e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:30,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:30,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:30,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:09:38<32:57:14, 6.93s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:41,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:41,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:41,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:09:45<32:47:39, 6.89s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:09:45<32:47:39, 6.89s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:49,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:09:52<32:28:47, 6.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:09:52<32:28:47, 6.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.525, 'learning_rate': 7.12e-05, 'epoch': 0.8} + 4%|██▉ | 715/17840 [1:09:52<32:28:47, 6.83s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:58,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:58,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1788, 'learning_rate': 7.13e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:58,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:58,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:07:58,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:10:05<32:06:46, 6.75s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:08,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:08,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:10:12<31:49:28, 6.69s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:10:12<31:49:28, 6.69s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2138, 'learning_rate': 7.15e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:16,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:10:18<31:39:37, 6.66s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:10:18<31:39:37, 6.66s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9823, 'learning_rate': 7.16e-05, 'epoch': 0.81} + 4%|██▉ | 719/17840 [1:10:18<31:39:37, 6.66s/it]g-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:24,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:24,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3374, 'learning_rate': 7.17e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:24,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:24,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:24,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:05:36,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:10:31<31:25:45, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:10:31<31:25:45, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:10:31<31:25:45, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:10:38<31:16:55, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:10:38<31:16:55, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:40,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:40,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:10:44<31:06:11, 6.54s/it]g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:10:44<31:06:11, 6.54s/it]g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:47,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:47,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:10:51<30:50:07, 6.49s/it]g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:10:51<30:50:07, 6.49s/it]g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4879, 'learning_rate': 7.21e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-18 10:08:55,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2617, 'learning_rate': 7.22e-05, 'epoch': 0.81} + g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:03,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:03,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5736, 'learning_rate': 7.23e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:03,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3347, 'learning_rate': 7.24e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:15,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:15,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3685, 'learning_rate': 7.25e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:15,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:21,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:21,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1945, 'learning_rate': 7.26e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:21,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:21,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:27,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:27,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:32,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:32,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 731/17840 [1:11:34<29:08:40, 6.13s/it]g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 731/17840 [1:11:34<29:08:40, 6.13s/it]g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:38,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:38,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:11:40<28:50:16, 6.07s/it]g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:42,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:42,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:42,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:11:46<28:25:01, 5.98s/it]g-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:48,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:48,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:48,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:08:32,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 734/17840 [1:11:51<27:53:03, 5.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 734/17840 [1:11:51<27:53:03, 5.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:56,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:09:56,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1264, 'learning_rate': 7.32e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:00,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:00,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 736/17840 [1:12:02<26:57:06, 5.67s/it]g-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:04,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:07,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:07,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4901, 'learning_rate': 7.340000000000001e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:11,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:11,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 738/17840 [1:12:13<25:54:00, 5.45s/it]g-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:15,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:15,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:15,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:09:52,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 739/17840 [1:12:18<25:14:00, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:21,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:21,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 740/17840 [1:12:23<24:33:13, 5.17s/it]g-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:24,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:27,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:27,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:29,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:31,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:31,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:33,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:33,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:33,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:18,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 743/17840 [1:12:36<22:13:06, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:36,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 744/17840 [1:12:40<21:11:59, 4.46s/it]g-point operations will not be computed-18 10:10:36,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 744/17840 [1:12:40<21:11:59, 4.46s/it]g-point operations will not be computed-18 10:10:36,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 744/17840 [1:12:40<21:11:59, 4.46s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:40,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 745/17840 [1:12:44<20:00:54, 4.21s/it]g-point operations will not be computed-18 10:10:40,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 745/17840 [1:12:44<20:00:54, 4.21s/it]g-point operations will not be computed-18 10:10:40,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 745/17840 [1:12:44<20:00:54, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:44,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 745/17840 [1:12:44<20:00:54, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:44,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 746/17840 [1:12:47<18:41:24, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:47,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 747/17840 [1:12:50<17:12:41, 3.62s/it]g-point operations will not be computed-18 10:10:47,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 747/17840 [1:12:50<17:12:41, 3.62s/it]g-point operations will not be computed-18 10:10:47,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:51,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:50,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:51,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:50,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:54,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:52,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:10:54,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:52,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 749/17840 [1:12:55<14:21:37, 3.02s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:55,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 750/17840 [1:12:57<13:40:17, 2.88s/it]g-point operations will not be computed-18 10:10:55,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 750/17840 [1:12:57<13:40:17, 2.88s/it]g-point operations will not be computed-18 10:10:55,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 750/17840 [1:12:57<13:40:17, 2.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:59,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 750/17840 [1:12:57<13:40:17, 2.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:10:59,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:11:03,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:59,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:11:03,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:10:59,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:13:05<20:35:43, 4.34s/it]g-point operations will not be computed-18 10:10:59,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:13:05<20:35:43, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:06,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:13:05<20:35:43, 4.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:06,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:13:13<25:02:52, 5.28s/it]g-point operations will not be computed-18 10:11:06,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:13:13<25:02:52, 5.28s/it]g-point operations will not be computed-18 10:11:06,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:13:13<25:02:52, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:13:13<25:02:52, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:13:13<25:02:52, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:20<27:59:19, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:20<27:59:19, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3605, 'learning_rate': 7.500000000000001e-05, 'epoch': 0.84} + 4%|███ | 753/17840 [1:13:20<27:59:19, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:20<27:59:19, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:13:20<27:59:19, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:13:27<29:54:51, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:11:30,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:11:30,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:13:34<31:10:57, 6.57s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:13:34<31:10:57, 6.57s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4604, 'learning_rate': 7.52e-05, 'epoch': 0.85} + 4%|███▏ | 755/17840 [1:13:34<31:10:57, 6.57s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:13:34<31:10:57, 6.57s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 755/17840 [1:13:34<31:10:57, 6.57s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 756/17840 [1:13:42<32:03:57, 6.76s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:11:44,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:11:44,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:13:49<32:25:39, 6.83s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:13:49<32:25:39, 6.83s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.52, 'learning_rate': 7.54e-05, 'epoch': 0.85} + 4%|███▏ | 757/17840 [1:13:49<32:25:39, 6.83s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:13:49<32:25:39, 6.83s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:13:49<32:25:39, 6.83s/it]g-point operations will not be computed-18 10:11:14,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 758/17840 [1:13:56<32:37:58, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 758/17840 [1:13:56<32:37:58, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 758/17840 [1:13:56<32:37:58, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:14:03<32:49:10, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:14:03<32:49:10, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2417, 'learning_rate': 7.560000000000001e-05, 'epoch': 0.85} + 4%|███▏ | 759/17840 [1:14:03<32:49:10, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:09,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:09,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2927, 'learning_rate': 7.570000000000001e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:09,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:09,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:09,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 761/17840 [1:14:16<32:44:04, 6.90s/it]g-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 761/17840 [1:14:16<32:44:04, 6.90s/it]g-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:21,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:14:23<32:45:08, 6.90s/it]g-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:14:23<32:45:08, 6.90s/it]g-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3332, 'learning_rate': 7.59e-05, 'epoch': 0.85} + 4%|███▏ | 762/17840 [1:14:23<32:45:08, 6.90s/it]g-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:14:23<32:45:08, 6.90s/it]g-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 762/17840 [1:14:23<32:45:08, 6.90s/it]g-point operations will not be computed-18 10:11:57,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 763/17840 [1:14:30<32:36:21, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 763/17840 [1:14:30<32:36:21, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 763/17840 [1:14:30<32:36:21, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:14:37<32:33:58, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 764/17840 [1:14:37<32:33:58, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2678, 'learning_rate': 7.61e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:41,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:14:44<32:28:34, 6.85s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:14:44<32:28:34, 6.85s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4164, 'learning_rate': 7.620000000000001e-05, 'epoch': 0.86} + 4%|███▏ | 765/17840 [1:14:44<32:28:34, 6.85s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:50,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:50,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2911, 'learning_rate': 7.630000000000001e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:50,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:12:50,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:14:57<32:09:34, 6.78s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:14:57<32:09:34, 6.78s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:00,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:00,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:15:04<31:54:28, 6.73s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:15:04<31:54:28, 6.73s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3816, 'learning_rate': 7.65e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:08,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:15:10<31:44:22, 6.69s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:15:10<31:44:22, 6.69s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3576, 'learning_rate': 7.66e-05, 'epoch': 0.86} + 4%|███▏ | 769/17840 [1:15:10<31:44:22, 6.69s/it]g-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:16,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:16,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3447, 'learning_rate': 7.670000000000001e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:16,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:16,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:16,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:12:31,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:15:23<31:21:12, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:15:23<31:21:12, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:15:23<31:21:12, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 772/17840 [1:15:30<31:12:22, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 772/17840 [1:15:30<31:12:22, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:33,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:33,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 773/17840 [1:15:37<31:07:05, 6.56s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 773/17840 [1:15:37<31:07:05, 6.56s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:39,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:39,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:15:43<30:52:33, 6.51s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 774/17840 [1:15:43<30:52:33, 6.51s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0431, 'learning_rate': 7.71e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:47,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 775/17840 [1:15:50<31:09:24, 6.57s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 775/17840 [1:15:50<31:09:24, 6.57s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0756, 'learning_rate': 7.72e-05, 'epoch': 0.87} + 4%|███▏ | 775/17840 [1:15:50<31:09:24, 6.57s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:55,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:55,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4031, 'learning_rate': 7.730000000000001e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:55,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:13:55,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:01,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:01,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:01,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:01,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:07,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:07,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:07,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:07,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:14,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:14,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:14,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:14,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:20,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:20,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:24,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:24,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:16:26<29:07:10, 6.15s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:16:26<29:07:10, 6.15s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:16:26<29:07:10, 6.15s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:16:26<29:07:10, 6.15s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:32,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:32,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:36,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:36,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 783/17840 [1:16:38<28:30:40, 6.02s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 783/17840 [1:16:38<28:30:40, 6.02s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:42,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:42,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 784/17840 [1:16:44<28:08:17, 5.94s/it]g-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:46,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:46,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:46,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:13:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 785/17840 [1:16:50<27:35:24, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 785/17840 [1:16:50<27:35:24, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:54,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:54,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1325, 'learning_rate': 7.83e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:58,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:14:58,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 787/17840 [1:17:00<26:39:48, 5.63s/it]g-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:02,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:05,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:05,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4398, 'learning_rate': 7.850000000000001e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:09,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:09,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 789/17840 [1:17:11<25:39:32, 5.42s/it]g-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:13,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:15,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:15,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2772, 'learning_rate': 7.87e-05, 'epoch': 0.89} +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:19,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:19,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:14:50,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 791/17840 [1:17:21<24:24:48, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:23,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 792/17840 [1:17:25<23:34:53, 4.98s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 792/17840 [1:17:25<23:34:53, 4.98s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:27,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:29,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:29,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:31,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:33,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:33,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:35,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:35,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:36,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:39,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:39,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:41,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:41,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:44,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:45,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:45,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:47,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:47,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:50,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:50,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5779, 'learning_rate': 7.970000000000001e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:54,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:54,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:58,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:15:58,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4934, 'learning_rate': 7.98e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:01,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:01,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:05,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:05,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.334, 'learning_rate': 7.99e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:05,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:12,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:12,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5514, 'learning_rate': 8e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:12,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:12,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:18:20<29:30:45, 6.24s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:18:20<29:30:45, 6.24s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3268, 'learning_rate': 8.010000000000001e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:25,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:18:27<30:48:14, 6.51s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:18:27<30:48:14, 6.51s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0859, 'learning_rate': 8.020000000000001e-05, 'epoch': 0.9} + 5%|███▎ | 805/17840 [1:18:27<30:48:14, 6.51s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:18:27<30:48:14, 6.51s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:18:27<30:48:14, 6.51s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:18:34<31:32:36, 6.67s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 806/17840 [1:18:34<31:32:36, 6.67s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:39,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:18:41<32:03:19, 6.78s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:18:41<32:03:19, 6.78s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4434, 'learning_rate': 8.04e-05, 'epoch': 0.9} + 5%|███▎ | 807/17840 [1:18:41<32:03:19, 6.78s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:18:41<32:03:19, 6.78s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 807/17840 [1:18:41<32:03:19, 6.78s/it]g-point operations will not be computed-18 10:15:21,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:18:48<32:15:58, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:18:48<32:15:58, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:18:48<32:15:58, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 809/17840 [1:18:55<32:19:34, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 809/17840 [1:18:55<32:19:34, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4699, 'learning_rate': 8.060000000000001e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-18 10:16:59,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:19:02<32:21:51, 6.84s/it]g-point operations will not be computed-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:19:02<32:21:51, 6.84s/it]g-point operations will not be computed-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1764, 'learning_rate': 8.070000000000001e-05, 'epoch': 0.91} + 5%|███▎ | 810/17840 [1:19:02<32:21:51, 6.84s/it]g-point operations will not be computed-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:19:02<32:21:51, 6.84s/it]g-point operations will not be computed-18 10:16:49,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 811/17840 [1:19:09<32:17:34, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 811/17840 [1:19:09<32:17:34, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.507, 'learning_rate': 8.080000000000001e-05, 'epoch': 0.91} + 5%|███▎ | 811/17840 [1:19:09<32:17:34, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:19:15<32:09:02, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:19:15<32:09:02, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:18,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:18,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:18,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:19:22<32:04:13, 6.78s/it]g-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:19:22<32:04:13, 6.78s/it]g-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:19:22<32:04:13, 6.78s/it]g-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:28,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:28,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3329, 'learning_rate': 8.11e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:28,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:28,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:28,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:10,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:19:36<31:43:50, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:19:36<31:43:50, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:19:36<31:43:50, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:19:36<31:43:50, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 816/17840 [1:19:42<31:33:48, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 816/17840 [1:19:42<31:33:48, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:46,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:46,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 817/17840 [1:19:49<31:17:32, 6.62s/it]g-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 817/17840 [1:19:49<31:17:32, 6.62s/it]g-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 817/17840 [1:19:49<31:17:32, 6.62s/it]g-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:54,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:54,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3052, 'learning_rate': 8.15e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-18 10:17:54,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2881, 'learning_rate': 8.16e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:01,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:17:36,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:20:08<30:44:47, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:20:08<30:44:47, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:20:08<30:44:47, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:20:08<30:44:47, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:20:14<30:36:47, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:17,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:17,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:17,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:20:21<30:27:36, 6.44s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:23,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:23,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:23,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:20:27<30:21:01, 6.42s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:30,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:30,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:30,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 824/17840 [1:20:33<30:09:23, 6.38s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 824/17840 [1:20:33<30:09:23, 6.38s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:37,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:37,763 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:20:40<30:35:33, 6.47s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:20:40<30:35:33, 6.47s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:20:40<30:35:33, 6.47s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:46,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:46,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3779, 'learning_rate': 8.23e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:46,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:52,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:52,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2513, 'learning_rate': 8.24e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:52,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:58,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:18:58,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1463, 'learning_rate': 8.25e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:02,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:02,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:21:04<29:00:32, 6.14s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 829/17840 [1:21:04<29:00:32, 6.14s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:08,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:08,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 830/17840 [1:21:10<28:42:53, 6.08s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 830/17840 [1:21:10<28:42:53, 6.08s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:14,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:21:16<28:35:07, 6.05s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:21:16<28:35:07, 6.05s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:19,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:19,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:19,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:21:22<28:22:58, 6.01s/it]g-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:24,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:24,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:24,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:18:09,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:21:28<28:08:48, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:19:29,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:21:28<28:08:48, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:19:29,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:21:28<28:08:48, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:19:29,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 833/17840 [1:21:28<28:08:48, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:19:29,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:21:34<27:40:24, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:21:34<27:40:24, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:38,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:38,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2492, 'learning_rate': 8.32e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:42,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:42,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 836/17840 [1:21:45<26:43:42, 5.66s/it]g-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:47,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:49,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:49,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3848, 'learning_rate': 8.34e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:53,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:53,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 838/17840 [1:21:55<25:34:08, 5.41s/it]g-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:57,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:59,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:19:59,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:02,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:02,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:02,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:19:34,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 840/17840 [1:22:05<23:58:57, 5.08s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:05,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:07,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:05,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:07,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:05,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 841/17840 [1:22:09<23:03:54, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:09,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:11,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:09,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:11,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:09,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 842/17840 [1:22:13<21:58:55, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:13,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:15,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:13,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:15,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:13,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 843/17840 [1:22:17<20:43:04, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:17,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 844/17840 [1:22:20<19:33:22, 4.14s/it]g-point operations will not be computed-18 10:20:17,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 844/17840 [1:22:20<19:33:22, 4.14s/it]g-point operations will not be computed-18 10:20:17,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 844/17840 [1:22:20<19:33:22, 4.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:21,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 845/17840 [1:22:24<18:10:06, 3.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:24,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 845/17840 [1:22:24<18:10:06, 3.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:24,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 846/17840 [1:22:26<16:46:02, 3.55s/it]g-point operations will not be computed-18 10:20:24,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 846/17840 [1:22:26<16:46:02, 3.55s/it]g-point operations will not be computed-18 10:20:24,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:28,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:26,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:28,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:26,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 847/17840 [1:22:29<15:24:06, 3.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:29,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 848/17840 [1:22:31<14:08:32, 3.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:31,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 848/17840 [1:22:31<14:08:32, 3.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:31,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 849/17840 [1:22:34<12:57:50, 2.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:33,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 849/17840 [1:22:34<12:57:50, 2.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:33,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:22:36<12:32:37, 2.66s/it]g-point operations will not be computed-18 10:20:33,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:22:36<12:32:37, 2.66s/it]g-point operations will not be computed-18 10:20:33,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:22:36<12:32:37, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:37,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 850/17840 [1:22:36<12:32:37, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:37,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:41,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:37,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 851/17840 [1:22:44<19:39:38, 4.17s/it]g-point operations will not be computed-18 10:20:37,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 851/17840 [1:22:44<19:39:38, 4.17s/it]g-point operations will not be computed-18 10:20:37,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 851/17840 [1:22:44<19:39:38, 4.17s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:45,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 851/17840 [1:22:44<19:39:38, 4.17s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:45,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:45,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:45,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:22:51<24:16:32, 5.14s/it]g-point operations will not be computed-18 10:20:45,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:22:51<24:16:32, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 852/17840 [1:22:51<24:16:32, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:58,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:58,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.629, 'learning_rate': 8.5e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:58,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:58,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:20:58,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 854/17840 [1:23:06<29:16:24, 6.20s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 854/17840 [1:23:06<29:16:24, 6.20s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:21:10,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:23:13<30:34:03, 6.48s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:23:13<30:34:03, 6.48s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2819, 'learning_rate': 8.52e-05, 'epoch': 0.96} + 5%|███▌ | 855/17840 [1:23:13<30:34:03, 6.48s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:23:13<30:34:03, 6.48s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 855/17840 [1:23:13<30:34:03, 6.48s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 856/17840 [1:23:20<31:23:38, 6.65s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 856/17840 [1:23:20<31:23:38, 6.65s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:21:24,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:23:27<31:53:25, 6.76s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:23:27<31:53:25, 6.76s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4616, 'learning_rate': 8.54e-05, 'epoch': 0.96} + 5%|███▌ | 857/17840 [1:23:27<31:53:25, 6.76s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:23:27<31:53:25, 6.76s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:23:27<31:53:25, 6.76s/it]g-point operations will not be computed-18 10:20:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:23:34<32:02:05, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:23:34<32:02:05, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:23:34<32:02:05, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:23:40<32:04:28, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:23:40<32:04:28, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1367, 'learning_rate': 8.560000000000001e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-18 10:21:45,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:23:47<32:06:49, 6.81s/it]g-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:23:47<32:06:49, 6.81s/it]g-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.334, 'learning_rate': 8.57e-05, 'epoch': 0.96} + 5%|███▌ | 860/17840 [1:23:47<32:06:49, 6.81s/it]g-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:21:53,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:21:53,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5985, 'learning_rate': 8.58e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-18 10:21:53,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:21:53,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 862/17840 [1:24:01<31:51:52, 6.76s/it]g-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 862/17840 [1:24:01<31:51:52, 6.76s/it]g-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:03,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:03,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:24:07<31:43:47, 6.73s/it]g-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 863/17840 [1:24:07<31:43:47, 6.73s/it]g-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5156, 'learning_rate': 8.6e-05, 'epoch': 0.97} + 5%|███▌ | 863/17840 [1:24:07<31:43:47, 6.73s/it]g-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:13,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:13,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9826, 'learning_rate': 8.61e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:13,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:20,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:20,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.573, 'learning_rate': 8.620000000000001e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:20,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:20,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:20,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:21:35,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 866/17840 [1:24:27<31:14:52, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 866/17840 [1:24:27<31:14:52, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 866/17840 [1:24:27<31:14:52, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 866/17840 [1:24:27<31:14:52, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:24:34<31:01:52, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:36,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:36,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:36,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:24:40<30:54:14, 6.56s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:24:40<30:54:14, 6.56s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:44,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:44,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 869/17840 [1:24:47<30:43:19, 6.52s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 869/17840 [1:24:47<30:43:19, 6.52s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:50,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:50,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:24:53<30:23:01, 6.45s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:24:53<30:23:01, 6.45s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:24:53<30:23:01, 6.45s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:24:53<30:23:01, 6.45s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:58,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:58,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:58,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:22:58,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:05,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:05,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:09,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:25:12<29:49:33, 6.33s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:25:12<29:49:33, 6.33s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3634, 'learning_rate': 8.7e-05, 'epoch': 0.98} + 5%|███▌ | 873/17840 [1:25:12<29:49:33, 6.33s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:25:12<29:49:33, 6.33s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:17,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:17,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:17,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:24,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:24,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7002, 'learning_rate': 8.72e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:24,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:30,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:30,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4276, 'learning_rate': 8.730000000000001e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:30,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:36,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:36,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2804, 'learning_rate': 8.740000000000001e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:40,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:25:42<28:35:01, 6.07s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:25:42<28:35:01, 6.07s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2666, 'learning_rate': 8.75e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:46,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:46,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 879/17840 [1:25:48<28:06:02, 5.96s/it]g-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:50,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:50,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:50,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:22:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 880/17840 [1:25:53<27:29:47, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:23:54,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 880/17840 [1:25:53<27:29:47, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:23:54,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:58,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:23:54,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:23:58,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:23:54,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2366, 'learning_rate': 8.78e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:02,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:23:54,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 882/17840 [1:26:04<26:15:01, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 882/17840 [1:26:04<26:15:01, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4807, 'learning_rate': 8.790000000000001e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:08,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:08,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:11,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:13,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:13,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5712, 'learning_rate': 8.81e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:16,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:16,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:05,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 885/17840 [1:26:18<23:19:26, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:19,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 886/17840 [1:26:22<22:04:55, 4.69s/it]g-point operations will not be computed-18 10:24:19,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 886/17840 [1:26:22<22:04:55, 4.69s/it]g-point operations will not be computed-18 10:24:19,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 886/17840 [1:26:22<22:04:55, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:23,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 887/17840 [1:26:26<20:45:56, 4.41s/it]g-point operations will not be computed-18 10:24:23,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 887/17840 [1:26:26<20:45:56, 4.41s/it]g-point operations will not be computed-18 10:24:23,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 887/17840 [1:26:26<20:45:56, 4.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:26,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 888/17840 [1:26:29<19:17:29, 4.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:29,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 888/17840 [1:26:29<19:17:29, 4.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:29,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 889/17840 [1:26:32<17:40:39, 3.75s/it]g-point operations will not be computed-18 10:24:29,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 889/17840 [1:26:32<17:40:39, 3.75s/it]g-point operations will not be computed-18 10:24:29,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 889/17840 [1:26:32<17:40:39, 3.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:32,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 890/17840 [1:26:35<16:04:27, 3.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:35,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 890/17840 [1:26:35<16:04:27, 3.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:35,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 891/17840 [1:26:37<14:23:47, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:37,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 891/17840 [1:26:37<14:23:47, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:37,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:26:39<12:40:52, 2.69s/it]g-point operations will not be computed-18 10:24:37,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:26:39<12:40:52, 2.69s/it]g-point operations will not be computed-18 10:24:37,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:26:39<12:40:52, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:41,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 892/17840 [1:26:39<12:40:52, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:41,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:44,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:41,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:26:47<19:55:07, 4.23s/it]g-point operations will not be computed-18 10:24:41,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:26:47<19:55:07, 4.23s/it]g-point operations will not be computed-18 10:24:41,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 893/17840 [1:26:47<19:55:07, 4.23s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:48,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:24:52,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:48,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:26:54<24:27:50, 5.20s/it]g-point operations will not be computed-18 10:24:48,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:26:54<24:27:50, 5.20s/it]g-point operations will not be computed-18 10:24:48,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:26:54<24:27:50, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:26:54<24:27:50, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 894/17840 [1:26:54<24:27:50, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:27:02<27:20:48, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:27:02<27:20:48, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2175, 'learning_rate': 8.92e-05, 'epoch': 1.0} + 5%|███▋ | 895/17840 [1:27:02<27:20:48, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 895/17840 [1:27:02<27:20:48, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:08,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:08,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:08,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:08,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:08,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:27:16<30:28:28, 6.48s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:27:16<30:28:28, 6.48s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:20,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:20,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:27:23<31:28:25, 6.69s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:27:23<31:28:25, 6.69s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:27:23<31:28:25, 6.69s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:27:23<31:28:25, 6.69s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:27:23<31:28:25, 6.69s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:27:30<31:58:55, 6.80s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:33,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:33,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:27:38<32:55:58, 7.00s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:27:38<32:55:58, 7.00s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4204, 'learning_rate': 8.970000000000001e-05, 'epoch': 1.01} + 5%|███▋ | 900/17840 [1:27:38<32:55:58, 7.00s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:27:38<32:55:58, 7.00s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:27:38<32:55:58, 7.00s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:27:45<32:57:36, 7.00s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:27:45<32:57:36, 7.00s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:49,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:25:49,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:27:52<33:01:31, 7.02s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:27:52<33:01:31, 7.02s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:27:52<33:01:31, 7.02s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:27:52<33:01:31, 7.02s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:27:52<33:01:31, 7.02s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:27:59<33:03:42, 7.03s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:01,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 904/17840 [1:28:06<32:51:45, 6.99s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 904/17840 [1:28:06<32:51:45, 6.99s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:10,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:28:12<32:35:26, 6.93s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:28:12<32:35:26, 6.93s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.06, 'learning_rate': 9.020000000000001e-05, 'epoch': 1.01} + 5%|███▊ | 905/17840 [1:28:12<32:35:26, 6.93s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:28:12<32:35:26, 6.93s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:28:12<32:35:26, 6.93s/it]g-point operations will not be computed-18 10:24:55,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:28:19<32:17:49, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:28:19<32:17:49, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:28:19<32:17:49, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:28:19<32:17:49, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:28:26<32:12:47, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:28:26<32:12:47, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:28:26<32:12:47, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:32,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:32,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2448, 'learning_rate': 9.05e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:32,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:38,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:38,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0648, 'learning_rate': 9.06e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:38,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:38,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:38,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:28:46<31:44:37, 6.75s/it]g-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:48,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:48,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:48,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:28:52<31:28:15, 6.69s/it]g-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:28:52<31:28:15, 6.69s/it]g-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:28:52<31:28:15, 6.69s/it]g-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0749, 'learning_rate': 9.090000000000001e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-18 10:26:58,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:05,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:05,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0941, 'learning_rate': 9.1e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:05,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:05,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:05,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:26:20,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:29:12<30:50:21, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:29:12<30:50:21, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:29:12<30:50:21, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:29:12<30:50:21, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 915/17840 [1:29:18<30:39:33, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 915/17840 [1:29:18<30:39:33, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:22,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:22,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 916/17840 [1:29:25<30:23:31, 6.46s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:27,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:27,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:27,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 917/17840 [1:29:31<30:08:24, 6.41s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 917/17840 [1:29:31<30:08:24, 6.41s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:35,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:35,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 918/17840 [1:29:37<29:56:41, 6.37s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 918/17840 [1:29:37<29:56:41, 6.37s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:41,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:41,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 919/17840 [1:29:43<29:38:23, 6.31s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 919/17840 [1:29:43<29:38:23, 6.31s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:47,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:47,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:29:50<29:22:44, 6.25s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:29:50<29:22:44, 6.25s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:53,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:53,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 921/17840 [1:29:56<29:07:17, 6.20s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:58,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:58,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:27:58,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 922/17840 [1:30:02<28:53:55, 6.15s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:04,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:04,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:04,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 923/17840 [1:30:08<28:45:30, 6.12s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:10,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:10,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:10,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 924/17840 [1:30:14<28:28:44, 6.06s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:16,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:16,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 925/17840 [1:30:20<28:55:23, 6.16s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 925/17840 [1:30:20<28:55:23, 6.16s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:22,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:22,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:22,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 926/17840 [1:30:26<28:24:26, 6.05s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:28,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:31,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:31,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1726, 'learning_rate': 9.240000000000001e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:31,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:36,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:36,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2846, 'learning_rate': 9.250000000000001e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:40,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 929/17840 [1:30:42<26:49:31, 5.71s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 929/17840 [1:30:42<26:49:31, 5.71s/it]g-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:44,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:44,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:44,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:27:13,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 930/17840 [1:30:48<26:17:00, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:28:48,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 930/17840 [1:30:48<26:17:00, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:28:48,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:52,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:48,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:52,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:48,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:55,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:48,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:55,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:48,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:28:55,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:48,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 932/17840 [1:30:58<24:52:50, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:01,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 933/17840 [1:31:03<24:06:05, 5.13s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 933/17840 [1:31:03<24:06:05, 5.13s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:04,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:06,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:06,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:09,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:11,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:11,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:13,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:15,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:15,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:16,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:18,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:18,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:21,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:21,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:23,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:26,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:26,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:27,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:27,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:29,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:29,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:31,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:31,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.144, 'learning_rate': 9.39e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:35,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:35,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:38,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:38,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0666, 'learning_rate': 9.4e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:42,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:42,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:42,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:46,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:50,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:29:50,126 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 945/17840 [1:31:54<27:09:25, 5.79s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 945/17840 [1:31:54<27:09:25, 5.79s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.278, 'learning_rate': 9.42e-05, 'epoch': 1.06} + 5%|███▉ | 945/17840 [1:31:54<27:09:25, 5.79s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 945/17840 [1:31:54<27:09:25, 5.79s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:32:01<29:08:32, 6.21s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:32:01<29:08:32, 6.21s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:04,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:04,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:04,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:32:08<30:31:04, 6.50s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:32:08<30:31:04, 6.50s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:32:08<30:31:04, 6.50s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:32:08<30:31:04, 6.50s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 947/17840 [1:32:08<30:31:04, 6.50s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:32:16<31:26:47, 6.70s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:32:16<31:26:47, 6.70s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:32:16<31:26:47, 6.70s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:22,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:22,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9222, 'learning_rate': 9.46e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:22,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:22,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:32:30<33:03:54, 7.05s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:32:30<33:03:54, 7.05s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.014, 'learning_rate': 9.47e-05, 'epoch': 1.07} + 5%|███▉ | 950/17840 [1:32:30<33:03:54, 7.05s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:37,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:37,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0089, 'learning_rate': 9.48e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:37,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:37,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:37,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 952/17840 [1:32:44<32:58:16, 7.03s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 952/17840 [1:32:44<32:58:16, 7.03s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:49,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:30:49,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:32:51<32:44:47, 6.98s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:32:51<32:44:47, 6.98s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:32:51<32:44:47, 6.98s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:32:51<32:44:47, 6.98s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:32:51<32:44:47, 6.98s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 954/17840 [1:32:58<32:47:16, 6.99s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 954/17840 [1:32:58<32:47:16, 6.99s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:03,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:03,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:33:05<32:40:10, 6.97s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:33:05<32:40:10, 6.97s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:33:05<32:40:10, 6.97s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:33:05<32:40:10, 6.97s/it]g-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:11,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:11,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:11,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:11,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:11,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:28:58,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:33:19<32:02:47, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:33:19<32:02:47, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:33:19<32:02:47, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:33:19<32:02:47, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 958/17840 [1:33:25<31:48:06, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:28,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:28,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:28,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:33:32<31:39:53, 6.75s/it]g-point operations will not be computed-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:33:32<31:39:53, 6.75s/it]g-point operations will not be computed-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:33:32<31:39:53, 6.75s/it]g-point operations will not be computed-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:33:32<31:39:53, 6.75s/it]g-point operations will not be computed-18 10:31:19,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8826, 'learning_rate': 9.57e-05, 'epoch': 1.08} + 5%|███▉ | 960/17840 [1:33:38<31:23:51, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:33:38<31:23:51, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:33:38<31:23:51, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:33:38<31:23:51, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:33:45<31:06:55, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:47,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:47,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:47,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:33:51<30:53:02, 6.59s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:54,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:54,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:31:54,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 963/17840 [1:33:58<30:40:10, 6.54s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 963/17840 [1:33:58<30:40:10, 6.54s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:02,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:02,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 964/17840 [1:34:04<30:25:32, 6.49s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 964/17840 [1:34:04<30:25:32, 6.49s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:08,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 965/17840 [1:34:11<30:16:36, 6.46s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 965/17840 [1:34:11<30:16:36, 6.46s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9186, 'learning_rate': 9.620000000000001e-05, 'epoch': 1.08} + 5%|████ | 965/17840 [1:34:11<30:16:36, 6.46s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:16,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:16,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1462, 'learning_rate': 9.63e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:21,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:34:23<29:47:40, 6.36s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:34:23<29:47:40, 6.36s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1538, 'learning_rate': 9.64e-05, 'epoch': 1.08} + 5%|████ | 967/17840 [1:34:23<29:47:40, 6.36s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:28,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:28,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1535, 'learning_rate': 9.65e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:28,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:35,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:35,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9954, 'learning_rate': 9.66e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:35,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:41,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:41,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9148, 'learning_rate': 9.67e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:41,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:41,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:47,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:47,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:51,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 972/17840 [1:34:53<28:37:55, 6.11s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 972/17840 [1:34:53<28:37:55, 6.11s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1036, 'learning_rate': 9.69e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:57,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:32:57,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 973/17840 [1:34:59<28:23:24, 6.06s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:02,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:02,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:02,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:35:05<27:59:11, 5.97s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:07,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:07,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:07,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:35:12<28:24:40, 6.06s/it]g-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:14,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:14,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:14,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:31:39,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 976/17840 [1:35:17<27:54:36, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 976/17840 [1:35:17<27:54:36, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:22,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:22,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3465, 'learning_rate': 9.74e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:26,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:35:28<26:50:14, 5.73s/it]g-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:35:28<26:50:14, 5.73s/it]g-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:30,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:30,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:30,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 979/17840 [1:35:34<26:19:40, 5.62s/it]g-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:35,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:38,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:38,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3157, 'learning_rate': 9.77e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:42,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:42,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:18,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 981/17840 [1:35:44<24:53:38, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:47,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 982/17840 [1:35:48<24:10:47, 5.16s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 982/17840 [1:35:48<24:10:47, 5.16s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:50,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:52,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:52,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:54,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:56,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:56,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:33:58,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:00,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:00,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:02,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:04,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:04,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:07,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:07,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:09,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:11,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:11,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:12,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:12,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:15,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:15,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:17,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:17,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:19,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:19,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0895, 'learning_rate': 9.89e-05, 'epoch': 1.11} +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:23,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:23,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:26,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:26,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0623, 'learning_rate': 9.900000000000001e-05, 'epoch': 1.11} +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:30,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:30,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:34,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:34,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2533, 'learning_rate': 9.910000000000001e-05, 'epoch': 1.11} +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:37,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:41,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:41,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3767, 'learning_rate': 9.92e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:41,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:41,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:36:49<28:44:14, 6.14s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 996/17840 [1:36:49<28:44:14, 6.14s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4277, 'learning_rate': 9.93e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-18 10:34:54,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:36:56<30:07:49, 6.44s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:36:56<30:07:49, 6.44s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0641, 'learning_rate': 9.94e-05, 'epoch': 1.12} + 6%|████▏ | 997/17840 [1:36:56<30:07:49, 6.44s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:36:56<30:07:49, 6.44s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 997/17840 [1:36:56<30:07:49, 6.44s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:37:03<30:58:08, 6.62s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:37:03<30:58:08, 6.62s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:08,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:37:10<31:29:33, 6.73s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:37:10<31:29:33, 6.73s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2838, 'learning_rate': 9.960000000000001e-05, 'epoch': 1.12} + 6%|████▏ | 999/17840 [1:37:10<31:29:33, 6.73s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 999/17840 [1:37:10<31:29:33, 6.73s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1000/17840 [1:37:18<32:32:18, 6.96s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1000/17840 [1:37:18<32:32:18, 6.96s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9924, 'learning_rate': 9.970000000000001e-05, 'epoch': 1.12} + 6%|████ | 1000/17840 [1:37:18<32:32:18, 6.96s/it]g-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:24,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:24,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4368, 'learning_rate': 9.98e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:24,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:24,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:24,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:33:44,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:37:31<32:19:08, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:37:31<32:19:08, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:37:31<32:19:08, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:37:38<32:11:28, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:37:38<32:11:28, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.109, 'learning_rate': 0.0001, 'epoch': 1.12} + 6%|████ | 1003/17840 [1:37:38<32:11:28, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:44,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:44,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5525, 'learning_rate': 9.999406175771971e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:44,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:44,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:37:52<31:49:33, 6.81s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:37:52<31:49:33, 6.81s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:54,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:35:54,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:37:58<31:38:05, 6.77s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:37:58<31:38:05, 6.77s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1578, 'learning_rate': 9.998218527315915e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:03,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:38:05<31:27:48, 6.73s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:38:05<31:27:48, 6.73s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3036, 'learning_rate': 9.997624703087887e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:09,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:38:11<31:11:10, 6.67s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:38:11<31:11:10, 6.67s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3489, 'learning_rate': 9.997030878859858e-05, 'epoch': 1.13} + 6%|████ | 1008/17840 [1:38:11<31:11:10, 6.67s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:38:11<31:11:10, 6.67s/it]g-point operations will not be computed-18 10:35:32,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1009/17840 [1:38:18<31:03:07, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1009/17840 [1:38:18<31:03:07, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1936, 'learning_rate': 9.99643705463183e-05, 'epoch': 1.13} + 6%|████▏ | 1009/17840 [1:38:18<31:03:07, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1010/17840 [1:38:25<30:55:30, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1010/17840 [1:38:25<30:55:30, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:27,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:27,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:38:31<30:45:46, 6.58s/it]g-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1011/17840 [1:38:31<30:45:46, 6.58s/it]g-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1043, 'learning_rate': 9.995249406175773e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:35,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:38:38<30:38:31, 6.56s/it]g-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:38:38<30:38:31, 6.56s/it]g-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9048, 'learning_rate': 9.994655581947743e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:42,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:38:44<30:21:20, 6.49s/it]g-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:38:44<30:21:20, 6.49s/it]g-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9597, 'learning_rate': 9.994061757719715e-05, 'epoch': 1.14} + 6%|████▏ | 1013/17840 [1:38:44<30:21:20, 6.49s/it]g-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:50,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:50,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9986, 'learning_rate': 9.993467933491687e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:50,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:56,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:56,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.954, 'learning_rate': 9.992874109263658e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:56,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:36:56,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:36:19,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:39:03<29:45:20, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:04,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:39:03<29:45:20, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:04,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.227, 'learning_rate': 9.99228028503563e-05, 'epoch': 1.14} + 6%|████▏ | 1016/17840 [1:39:03<29:45:20, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:04,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1017/17840 [1:39:09<29:32:43, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:10,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1017/17840 [1:39:09<29:32:43, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:10,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8684, 'learning_rate': 9.991686460807601e-05, 'epoch': 1.14} + 6%|████▏ | 1017/17840 [1:39:09<29:32:43, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:10,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1018/17840 [1:39:15<29:20:43, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:16,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1018/17840 [1:39:15<29:20:43, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:16,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2141, 'learning_rate': 9.991092636579573e-05, 'epoch': 1.14} + 6%|████▏ | 1018/17840 [1:39:15<29:20:43, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:16,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:39:21<29:01:12, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:22,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:39:21<29:01:12, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:22,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.03, 'learning_rate': 9.990498812351544e-05, 'epoch': 1.14} + 6%|████▏ | 1019/17840 [1:39:21<29:01:12, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:22,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:39:21<29:01:12, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:22,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:39:27<28:51:39, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:28,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:39:27<28:51:39, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:28,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:39:27<28:51:39, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:28,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:39:27<28:51:39, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:28,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1021/17840 [1:39:34<28:41:34, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1021/17840 [1:39:34<28:41:34, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:39,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:39,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.979, 'learning_rate': 9.98871733966746e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:39,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:39,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:45,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:45,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:49,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:49,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1024/17840 [1:39:51<27:57:29, 5.99s/it]g-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1024/17840 [1:39:51<27:57:29, 5.99s/it]g-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:37:55,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:39:58<28:27:46, 6.09s/it]g-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:39:58<28:27:46, 6.09s/it]g-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9922, 'learning_rate': 9.986935866983373e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:01,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:01,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1026/17840 [1:40:03<28:01:27, 6.00s/it]g-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:05,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:05,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:05,923 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:37:34,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1027/17840 [1:40:09<27:18:38, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1027/17840 [1:40:09<27:18:38, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:14,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:14,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1891, 'learning_rate': 9.985154394299288e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:18,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:18,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1029/17840 [1:40:20<26:16:11, 5.63s/it]g-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1030/17840 [1:40:25<25:41:29, 5.50s/it]g-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:27,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:27,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:29,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:29,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:33,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:33,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:10,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1032/17840 [1:40:35<24:20:43, 5.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:38,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:38,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1033/17840 [1:40:40<23:34:05, 5.05s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:41,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:41,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:43,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:45,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:45,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:47,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:49,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:49,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:51,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:53,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:53,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:56,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:58,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:58,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:59,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:38:59,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:02,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:02,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:04,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:04,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:06,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:06,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:07,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:07,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:11,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:11,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:11,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:15,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:18,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:18,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:22,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2115, 'learning_rate': 9.975653206650832e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:26,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:26,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:26,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:41:30<26:46:08, 5.74s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:41:30<26:46:08, 5.74s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:35,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:41:37<28:52:19, 6.19s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:41:37<28:52:19, 6.19s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1383, 'learning_rate': 9.974465558194775e-05, 'epoch': 1.17} + 6%|████▎ | 1046/17840 [1:41:37<28:52:19, 6.19s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:41:37<28:52:19, 6.19s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:41:37<28:52:19, 6.19s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1047/17840 [1:41:44<30:10:07, 6.47s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:47,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:47,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1048/17840 [1:41:51<30:59:50, 6.65s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1048/17840 [1:41:51<30:59:50, 6.65s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0163, 'learning_rate': 9.973277909738718e-05, 'epoch': 1.17} + 6%|████▎ | 1048/17840 [1:41:51<30:59:50, 6.65s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:58,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:58,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5938, 'learning_rate': 9.97268408551069e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:58,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:39:58,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:42:06<32:33:51, 6.98s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:42:06<32:33:51, 6.98s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6165, 'learning_rate': 9.97209026128266e-05, 'epoch': 1.18} + 6%|████▎ | 1050/17840 [1:42:06<32:33:51, 6.98s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:42:06<32:33:51, 6.98s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:42:06<32:33:51, 6.98s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1051/17840 [1:42:13<32:36:23, 6.99s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:40:16,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:40:16,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1052/17840 [1:42:20<32:25:07, 6.95s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1052/17840 [1:42:20<32:25:07, 6.95s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1979, 'learning_rate': 9.970902612826603e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-18 10:40:24,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:42:27<32:14:24, 6.91s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:42:27<32:14:24, 6.91s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1921, 'learning_rate': 9.970308788598575e-05, 'epoch': 1.18} + 6%|████▎ | 1053/17840 [1:42:27<32:14:24, 6.91s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:42:27<32:14:24, 6.91s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1053/17840 [1:42:27<32:14:24, 6.91s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1054/17840 [1:42:33<32:00:52, 6.87s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:40:36,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:40:36,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1055/17840 [1:42:40<31:47:07, 6.82s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1055/17840 [1:42:40<31:47:07, 6.82s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:40:43,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:40:43,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:42:47<31:41:49, 6.80s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:42:47<31:41:49, 6.80s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2978, 'learning_rate': 9.96852731591449e-05, 'epoch': 1.18} + 6%|████▎ | 1056/17840 [1:42:47<31:41:49, 6.80s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:42:47<31:41:49, 6.80s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1056/17840 [1:42:47<31:41:49, 6.80s/it]g-point operations will not be computed-18 10:38:35,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:42:54<31:31:38, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:42:54<31:31:38, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:42:54<31:31:38, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:42:54<31:31:38, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1058/17840 [1:43:00<31:16:49, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:03,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:03,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1059/17840 [1:43:07<31:04:46, 6.67s/it]g-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1059/17840 [1:43:07<31:04:46, 6.67s/it]g-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8067, 'learning_rate': 9.966745843230403e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1060/17840 [1:43:13<30:53:33, 6.63s/it]g-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1060/17840 [1:43:13<30:53:33, 6.63s/it]g-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2775, 'learning_rate': 9.966152019002377e-05, 'epoch': 1.19} + 6%|████▎ | 1060/17840 [1:43:13<30:53:33, 6.63s/it]g-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:19,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:19,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3614, 'learning_rate': 9.965558194774347e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:19,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:19,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:19,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:40:55,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:43:26<30:34:52, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:43:26<30:34:52, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:43:26<30:34:52, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1063/17840 [1:43:33<30:26:03, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1063/17840 [1:43:33<30:26:03, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:35,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:35,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1064/17840 [1:43:39<30:15:45, 6.49s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1064/17840 [1:43:39<30:15:45, 6.49s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:42,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:42,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1065/17840 [1:43:45<30:06:33, 6.46s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1065/17840 [1:43:45<30:06:33, 6.46s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2268, 'learning_rate': 9.963182897862233e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:49,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:43:52<29:57:03, 6.43s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:43:52<29:57:03, 6.43s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5751, 'learning_rate': 9.962589073634205e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:56,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:41:56,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1067/17840 [1:43:58<29:48:56, 6.40s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1067/17840 [1:43:58<29:48:56, 6.40s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:02,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:02,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:44:04<29:30:48, 6.33s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:44:04<29:30:48, 6.33s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:44:04<29:30:48, 6.33s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1068/17840 [1:44:04<29:30:48, 6.33s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:10,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:10,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:10,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:10,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:16,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:16,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:20,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1071/17840 [1:44:23<28:41:16, 6.16s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1071/17840 [1:44:23<28:41:16, 6.16s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:26,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:26,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1072/17840 [1:44:29<28:30:29, 6.12s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1072/17840 [1:44:29<28:30:29, 6.12s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:32,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1073/17840 [1:44:35<28:20:52, 6.09s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:37,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:37,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:37,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1074/17840 [1:44:40<27:57:52, 6.00s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:43,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:43,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:43,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1075/17840 [1:44:47<28:21:15, 6.09s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:49,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:49,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:49,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1076/17840 [1:44:52<27:50:22, 5.98s/it]g-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:55,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:55,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:42:55,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:41:27,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1077/17840 [1:44:58<27:15:03, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:42:59,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1077/17840 [1:44:58<27:15:03, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:42:59,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1077/17840 [1:44:58<27:15:03, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:42:59,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:03,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:42:59,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:05,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:42:59,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:05,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:42:59,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:05,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:42:59,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1079/17840 [1:45:09<26:11:08, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:43:09,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1079/17840 [1:45:09<26:11:08, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:43:09,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:13,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:09,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:13,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:09,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1477, 'learning_rate': 9.954275534441807e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:17,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:09,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:17,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:09,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1081/17840 [1:45:19<24:52:47, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:22,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1082/17840 [1:45:24<24:03:56, 5.17s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1082/17840 [1:45:24<24:03:56, 5.17s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:25,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:28,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:28,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:30,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:32,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:32,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:34,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:36,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:36,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:38,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:40,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:40,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:42,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:43,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:43,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:45,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:45,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:48,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:49,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:49,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:52,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:52,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:54,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:54,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:56,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:43:56,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9307, 'learning_rate': 9.947149643705463e-05, 'epoch': 1.22} +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:00,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:00,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:04,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:04,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.421, 'learning_rate': 9.946555819477435e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:08,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:08,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:08,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:11,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:11,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:11,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:19,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:19,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0895, 'learning_rate': 9.945368171021379e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:19,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:19,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:46:27<28:45:41, 6.18s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:46:27<28:45:41, 6.18s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4482, 'learning_rate': 9.94477434679335e-05, 'epoch': 1.23} + 6%|████▍ | 1096/17840 [1:46:27<28:45:41, 6.18s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:33,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:33,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2375, 'learning_rate': 9.94418052256532e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:33,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:33,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1098/17840 [1:46:41<31:02:43, 6.68s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1098/17840 [1:46:41<31:02:43, 6.68s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.261, 'learning_rate': 9.943586698337292e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-18 10:44:45,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:46:48<31:34:42, 6.79s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:46:48<31:34:42, 6.79s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4983, 'learning_rate': 9.942992874109263e-05, 'epoch': 1.23} + 6%|████▍ | 1099/17840 [1:46:48<31:34:42, 6.79s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:46:48<31:34:42, 6.79s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:46:56<32:41:35, 7.03s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:46:56<32:41:35, 7.03s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4558, 'learning_rate': 9.942399049881236e-05, 'epoch': 1.23} + 6%|████▌ | 1100/17840 [1:46:56<32:41:35, 7.03s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:02,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:02,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5209, 'learning_rate': 9.941805225653207e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:02,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:02,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:47:10<32:33:55, 7.00s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1102/17840 [1:47:10<32:33:55, 7.00s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0346, 'learning_rate': 9.941211401425179e-05, 'epoch': 1.24} + 6%|████▌ | 1102/17840 [1:47:10<32:33:55, 7.00s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:16,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:16,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1174, 'learning_rate': 9.94061757719715e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:16,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:16,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:16,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1104/17840 [1:47:23<32:13:17, 6.93s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:26,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:26,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:47:30<32:01:07, 6.89s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:47:30<32:01:07, 6.89s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2923, 'learning_rate': 9.939429928741093e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:34,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:47:37<31:50:15, 6.85s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:47:37<31:50:15, 6.85s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1602, 'learning_rate': 9.938836104513065e-05, 'epoch': 1.24} + 6%|████▌ | 1106/17840 [1:47:37<31:50:15, 6.85s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:43,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:43,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4918, 'learning_rate': 9.938242280285037e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:43,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:43,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:43,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:47:50<31:23:07, 6.75s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:53,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:53,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:45:53,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1109/17840 [1:47:57<31:18:50, 6.74s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1109/17840 [1:47:57<31:18:50, 6.74s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:01,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:48:03<31:05:20, 6.69s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:48:03<31:05:20, 6.69s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2914, 'learning_rate': 9.93646080760095e-05, 'epoch': 1.24} + 6%|████▌ | 1110/17840 [1:48:03<31:05:20, 6.69s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:09,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:09,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1827, 'learning_rate': 9.935866983372922e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:09,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:09,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:09,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1112/17840 [1:48:16<30:41:39, 6.61s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:19,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:19,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:19,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1113/17840 [1:48:23<30:31:12, 6.57s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:25,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:25,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:25,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1114/17840 [1:48:29<30:18:37, 6.52s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1114/17840 [1:48:29<30:18:37, 6.52s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:33,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:33,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1115/17840 [1:48:36<30:12:33, 6.50s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1115/17840 [1:48:36<30:12:33, 6.50s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:40,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1116/17840 [1:48:42<30:04:48, 6.48s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1116/17840 [1:48:42<30:04:48, 6.48s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1639, 'learning_rate': 9.93289786223278e-05, 'epoch': 1.25} + 6%|████▌ | 1116/17840 [1:48:42<30:04:48, 6.48s/it]g-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:48,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:48,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3579, 'learning_rate': 9.932304038004752e-05, 'epoch': 1.25} +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:48,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:48,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:46:48,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:43:20,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:48:55<29:41:06, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:46:56,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:48:55<29:41:06, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:46:56,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:48:55<29:41:06, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:46:56,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:48:55<29:41:06, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:46:56,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:49:01<29:25:47, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:02,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:49:01<29:25:47, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:02,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:49:01<29:25:47, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:02,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:49:01<29:25:47, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:02,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1120/17840 [1:49:07<29:14:06, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:08,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1120/17840 [1:49:07<29:14:06, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:08,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1120/17840 [1:49:07<29:14:06, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:08,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1120/17840 [1:49:07<29:14:06, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:08,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:49:13<28:52:25, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:49:13<28:52:25, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:18,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:18,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2633, 'learning_rate': 9.929334916864609e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:18,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:24,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:24,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2973, 'learning_rate': 9.92874109263658e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:24,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:30,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:30,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0879, 'learning_rate': 9.928147268408552e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:30,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:30,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:30,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:14,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:49:38<28:25:54, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:49:38<28:25:54, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:42,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:42,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0588, 'learning_rate': 9.926959619952494e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:47,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:47,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1127/17840 [1:49:49<27:09:49, 5.85s/it]g-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:51,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:53,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:53,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4481, 'learning_rate': 9.925771971496437e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-18 10:47:57,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:49:59<26:03:50, 5.61s/it]g-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:49:59<26:03:50, 5.61s/it]g-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:01,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:01,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:01,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:47:38,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1130/17840 [1:50:05<25:25:05, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:05,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:08,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:05,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1131/17840 [1:50:10<24:47:14, 5.34s/it]g-point operations will not be computed-18 10:48:05,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1131/17840 [1:50:10<24:47:14, 5.34s/it]g-point operations will not be computed-18 10:48:05,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:11,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:05,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:14,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:05,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:14,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:05,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9164, 'learning_rate': 9.923396674584323e-05, 'epoch': 1.27} +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:17,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:05,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1133/17840 [1:50:19<23:06:05, 4.98s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:19,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1133/17840 [1:50:19<23:06:05, 4.98s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:19,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:21,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:19,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1134/17840 [1:50:23<22:03:52, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:24,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1134/17840 [1:50:23<22:03:52, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:24,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:25,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:24,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:25,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:24,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1135/17840 [1:50:27<20:49:25, 4.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:27,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:29,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:27,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:29,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:27,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1136/17840 [1:50:31<19:32:24, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1137/17840 [1:50:34<18:15:08, 3.93s/it]g-point operations will not be computed-18 10:48:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1137/17840 [1:50:34<18:15:08, 3.93s/it]g-point operations will not be computed-18 10:48:31,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:35,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:34,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:35,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:34,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1138/17840 [1:50:37<16:51:43, 3.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:37,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1139/17840 [1:50:39<15:26:45, 3.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:39,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1139/17840 [1:50:39<15:26:45, 3.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:39,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1140/17840 [1:50:42<14:11:41, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:42,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1140/17840 [1:50:42<14:11:41, 3.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:42,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1141/17840 [1:50:44<12:59:28, 2.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:44,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1141/17840 [1:50:44<12:59:28, 2.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:44,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:50:46<11:50:17, 2.55s/it]g-point operations will not be computed-18 10:48:44,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:50:46<11:50:17, 2.55s/it]g-point operations will not be computed-18 10:48:44,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:50:46<11:50:17, 2.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:47,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:50:46<11:50:17, 2.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:47,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:48:51,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:48:47,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:50:54<18:46:19, 4.05s/it]g-point operations will not be computed-18 10:48:47,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:50:54<18:46:19, 4.05s/it]g-point operations will not be computed-18 10:48:47,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:50:54<18:46:19, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:55,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:50:54<18:46:19, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:48:55,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:51:01<23:20:57, 5.03s/it]g-point operations will not be computed-18 10:48:55,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:51:01<23:20:57, 5.03s/it]g-point operations will not be computed-18 10:48:55,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:51:01<23:20:57, 5.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:51:01<23:20:57, 5.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:06,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:51:08<26:26:45, 5.70s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:51:08<26:26:45, 5.70s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4944, 'learning_rate': 9.915676959619952e-05, 'epoch': 1.28} + 6%|████▋ | 1145/17840 [1:51:08<26:26:45, 5.70s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:15,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:15,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1921, 'learning_rate': 9.915083135391924e-05, 'epoch': 1.28} +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:15,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:15,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:51:22<29:45:54, 6.42s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:51:22<29:45:54, 6.42s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1756, 'learning_rate': 9.914489311163896e-05, 'epoch': 1.29} +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:27,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.979, 'learning_rate': 9.913895486935868e-05, 'epoch': 1.29} + g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:51:37<31:17:24, 6.75s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:51:37<31:17:24, 6.75s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4141, 'learning_rate': 9.913301662707839e-05, 'epoch': 1.29} +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:41,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:51:44<32:23:06, 6.99s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:51:44<32:23:06, 6.99s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.075, 'learning_rate': 9.91270783847981e-05, 'epoch': 1.29} + 6%|████▋ | 1150/17840 [1:51:44<32:23:06, 6.99s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:51:44<32:23:06, 6.99s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:51:44<32:23:06, 6.99s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:51:51<32:22:44, 6.98s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:51:51<32:22:44, 6.98s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:55,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:49:55,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:51:58<32:14:01, 6.95s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:51:58<32:14:01, 6.95s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:51:58<32:14:01, 6.95s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:51:58<32:14:01, 6.95s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:51:58<32:14:01, 6.95s/it]g-point operations will not be computed-18 10:49:02,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:52:05<31:57:49, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:52:05<31:57:49, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:52:05<31:57:49, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:52:05<31:57:49, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1154/17840 [1:52:11<31:45:20, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:14,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:14,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:14,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:52:18<31:35:36, 6.82s/it]g-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:52:18<31:35:36, 6.82s/it]g-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:52:18<31:35:36, 6.82s/it]g-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:24,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:24,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9513, 'learning_rate': 9.909144893111639e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:24,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:24,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:24,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:06,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1157/17840 [1:52:32<31:14:41, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1157/17840 [1:52:32<31:14:41, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1157/17840 [1:52:32<31:14:41, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1157/17840 [1:52:32<31:14:41, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:52:38<31:01:43, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:41,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:41,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:41,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:52:45<30:51:08, 6.66s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:52:45<30:51:08, 6.66s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:52:45<30:51:08, 6.66s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:51,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:51,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9434, 'learning_rate': 9.906769596199526e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:51,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:57,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:57,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9876, 'learning_rate': 9.906175771971497e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:57,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:57,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:50:57,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:53:04<30:24:45, 6.56s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:07,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:07,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:07,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:53:11<30:13:53, 6.53s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:13,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:13,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:13,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1164/17840 [1:53:17<30:05:09, 6.49s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:20,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:20,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:20,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1165/17840 [1:53:24<29:52:01, 6.45s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:26,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:26,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:53:30<29:42:08, 6.41s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:53:30<29:42:08, 6.41s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.091, 'learning_rate': 9.903206650831354e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:34,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:53:36<29:40:04, 6.41s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:53:36<29:40:04, 6.41s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1602, 'learning_rate': 9.902612826603326e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:40,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:53:42<29:24:24, 6.35s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:53:42<29:24:24, 6.35s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0634, 'learning_rate': 9.902019002375298e-05, 'epoch': 1.31} + 7%|████▊ | 1168/17840 [1:53:42<29:24:24, 6.35s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:48,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:48,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2515, 'learning_rate': 9.901425178147269e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:48,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:54,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:54,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1793, 'learning_rate': 9.90083135391924e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-18 10:51:59,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:54:01<28:34:53, 6.17s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:54:01<28:34:53, 6.17s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6485, 'learning_rate': 9.900237529691212e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:05,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:54:07<28:26:32, 6.14s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:54:07<28:26:32, 6.14s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5801, 'learning_rate': 9.899643705463182e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:11,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1173/17840 [1:54:13<28:11:07, 6.09s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1173/17840 [1:54:13<28:11:07, 6.09s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3055, 'learning_rate': 9.899049881235156e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:16,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1174/17840 [1:54:19<27:51:37, 6.02s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1174/17840 [1:54:19<27:51:37, 6.02s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:21,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:21,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:54:25<28:12:03, 6.09s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:54:25<28:12:03, 6.09s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:27,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:27,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:27,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1176/17840 [1:54:31<27:42:08, 5.98s/it]g-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:33,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:33,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:33,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:50:33,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1177/17840 [1:54:36<27:06:40, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1177/17840 [1:54:36<27:06:40, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:41,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:41,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1936, 'learning_rate': 9.896080760095012e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:41,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:46,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:46,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:49,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:49,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:49,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:37,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1180/17840 [1:54:52<25:31:07, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:55,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1181/17840 [1:54:57<24:46:57, 5.36s/it]g-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1181/17840 [1:54:57<24:46:57, 5.36s/it]g-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:52:59,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:01,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:01,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:03,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:06,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:06,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:08,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:08,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:08,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:52:53,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1184/17840 [1:55:11<21:54:26, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:11,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1185/17840 [1:55:15<20:42:45, 4.48s/it]g-point operations will not be computed-18 10:53:11,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1185/17840 [1:55:15<20:42:45, 4.48s/it]g-point operations will not be computed-18 10:53:11,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1185/17840 [1:55:15<20:42:45, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:15,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1186/17840 [1:55:18<19:30:20, 4.22s/it]g-point operations will not be computed-18 10:53:15,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1186/17840 [1:55:18<19:30:20, 4.22s/it]g-point operations will not be computed-18 10:53:15,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:20,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:18,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1187/17840 [1:55:21<18:11:27, 3.93s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:21,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1187/17840 [1:55:21<18:11:27, 3.93s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:21,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1188/17840 [1:55:24<16:47:54, 3.63s/it]g-point operations will not be computed-18 10:53:21,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1188/17840 [1:55:24<16:47:54, 3.63s/it]g-point operations will not be computed-18 10:53:21,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:26,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:24,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:26,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:24,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:28,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:27,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1190/17840 [1:55:29<14:12:14, 3.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:29,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1190/17840 [1:55:29<14:12:14, 3.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:29,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1191/17840 [1:55:32<12:54:03, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:31,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1191/17840 [1:55:32<12:54:03, 2.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:31,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1192/17840 [1:55:34<11:38:39, 2.52s/it]g-point operations will not be computed-18 10:53:31,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1192/17840 [1:55:34<11:38:39, 2.52s/it]g-point operations will not be computed-18 10:53:31,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1192/17840 [1:55:34<11:38:39, 2.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:35,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1192/17840 [1:55:34<11:38:39, 2.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:35,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:38,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:35,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:38,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:35,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1193/17840 [1:55:41<18:48:38, 4.07s/it]g-point operations will not be computed-18 10:53:35,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1193/17840 [1:55:41<18:48:38, 4.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:42,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:46,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:42,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:55:49<23:28:30, 5.08s/it]g-point operations will not be computed-18 10:53:42,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:55:49<23:28:30, 5.08s/it]g-point operations will not be computed-18 10:53:42,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:55:49<23:28:30, 5.08s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1194/17840 [1:55:49<23:28:30, 5.08s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:53,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:53:53,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1195/17840 [1:55:56<26:36:22, 5.75s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1195/17840 [1:55:56<26:36:22, 5.75s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1195/17840 [1:55:56<26:36:22, 5.75s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:02,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:02,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3373, 'learning_rate': 9.885391923990499e-05, 'epoch': 1.34} +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:02,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:02,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1197/17840 [1:56:10<29:56:39, 6.48s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1197/17840 [1:56:10<29:56:39, 6.48s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.156, 'learning_rate': 9.884798099762471e-05, 'epoch': 1.34} + 7%|████▉ | 1197/17840 [1:56:10<29:56:39, 6.48s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:17,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:17,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3351, 'learning_rate': 9.884204275534442e-05, 'epoch': 1.34} +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:17,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:17,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [1:56:24<31:17:52, 6.77s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [1:56:24<31:17:52, 6.77s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2694, 'learning_rate': 9.883610451306414e-05, 'epoch': 1.34} +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:29,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [1:56:32<32:10:38, 6.96s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [1:56:32<32:10:38, 6.96s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1195, 'learning_rate': 9.883016627078386e-05, 'epoch': 1.35} + 7%|████▉ | 1200/17840 [1:56:32<32:10:38, 6.96s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [1:56:32<32:10:38, 6.96s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [1:56:39<32:21:41, 7.00s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1201/17840 [1:56:39<32:21:41, 7.00s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1605, 'learning_rate': 9.882422802850356e-05, 'epoch': 1.35} + 7%|████▉ | 1201/17840 [1:56:39<32:21:41, 7.00s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4512, 'learning_rate': 9.881828978622329e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:45,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [1:56:53<32:09:34, 6.96s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:55,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:54:55,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [1:57:00<31:55:57, 6.91s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [1:57:00<31:55:57, 6.91s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.123, 'learning_rate': 9.880641330166271e-05, 'epoch': 1.35} + 7%|████▉ | 1204/17840 [1:57:00<31:55:57, 6.91s/it]g-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:06,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:06,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1022, 'learning_rate': 9.880047505938242e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:06,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:06,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:53:50,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [1:57:13<31:34:36, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [1:57:13<31:34:36, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5244, 'learning_rate': 9.879453681710214e-05, 'epoch': 1.35} + 7%|████▉ | 1206/17840 [1:57:13<31:34:36, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [1:57:20<31:16:17, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [1:57:20<31:16:17, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4598, 'learning_rate': 9.878859857482186e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:24,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1208/17840 [1:57:26<31:03:55, 6.72s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1208/17840 [1:57:26<31:03:55, 6.72s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3939, 'learning_rate': 9.878266033254158e-05, 'epoch': 1.35} + 7%|████▉ | 1208/17840 [1:57:26<31:03:55, 6.72s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1208/17840 [1:57:26<31:03:55, 6.72s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:32,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:32,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:32,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:39,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:39,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4983, 'learning_rate': 9.877078384798101e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:39,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:39,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:39,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [1:57:46<30:32:28, 6.61s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:49,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:49,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:49,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [1:57:53<30:26:47, 6.59s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:55:55,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1213/17840 [1:57:59<30:17:32, 6.56s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1213/17840 [1:57:59<30:17:32, 6.56s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:03,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1214/17840 [1:58:06<30:08:41, 6.53s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1214/17840 [1:58:06<30:08:41, 6.53s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1636, 'learning_rate': 9.874703087885986e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:10,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [1:58:12<29:57:09, 6.49s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [1:58:12<29:57:09, 6.49s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.216, 'learning_rate': 9.874109263657958e-05, 'epoch': 1.36} + 7%|████▉ | 1215/17840 [1:58:12<29:57:09, 6.49s/it]g-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:18,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:18,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1344, 'learning_rate': 9.873515439429929e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:18,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:18,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:18,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:55:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [1:58:25<29:40:14, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:26,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [1:58:25<29:40:14, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:26,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [1:58:25<29:40:14, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:26,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [1:58:25<29:40:14, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:26,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1218/17840 [1:58:31<29:23:41, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:26,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:33,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:26,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:33,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:26,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:33,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:26,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [1:58:37<29:09:00, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:38,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [1:58:37<29:09:00, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:38,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [1:58:37<29:09:00, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:38,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [1:58:37<29:09:00, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:38,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [1:58:43<29:00:23, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [1:58:43<29:00:23, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [1:58:43<29:00:23, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1220/17840 [1:58:43<29:00:23, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:44,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [1:58:49<28:48:02, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [1:58:49<28:48:02, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [1:58:49<28:48:02, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [1:58:49<28:48:02, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [1:58:55<28:32:21, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:56:58,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:01,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:01,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1748, 'learning_rate': 9.869358669833729e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:04,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:04,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:04,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:56:50,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [1:59:07<27:59:49, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:08,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [1:59:07<27:59:49, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:08,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [1:59:07<27:59:49, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:08,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [1:59:07<27:59:49, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:08,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [1:59:14<28:22:18, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [1:59:14<28:22:18, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:19,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:19,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3256, 'learning_rate': 9.867577197149644e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:19,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:24,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:24,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1795, 'learning_rate': 9.866983372921616e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:29,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1228/17840 [1:59:31<26:48:45, 5.81s/it]g-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1228/17840 [1:59:31<26:48:45, 5.81s/it]g-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:33,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:33,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:33,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1229/17840 [1:59:36<26:19:22, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:37,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1229/17840 [1:59:36<26:19:22, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:37,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:41,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:37,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:41,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:37,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8996, 'learning_rate': 9.86520190023753e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:45,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:37,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:45,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:37,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1231/17840 [1:59:47<25:18:58, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1231/17840 [1:59:47<25:18:58, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:51,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:51,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:53,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:56,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:56,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1525, 'learning_rate': 9.863420427553445e-05, 'epoch': 1.38} +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:59,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:57:59,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:57:47,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1234/17840 [2:00:01<22:47:16, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:01,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:03,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:01,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:03,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:01,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1235/17840 [2:00:05<21:37:31, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:05,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1236/17840 [2:00:09<20:24:41, 4.43s/it]g-point operations will not be computed-18 10:58:05,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1236/17840 [2:00:09<20:24:41, 4.43s/it]g-point operations will not be computed-18 10:58:05,787 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1236/17840 [2:00:09<20:24:41, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:09,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1237/17840 [2:00:12<19:07:18, 4.15s/it]g-point operations will not be computed-18 10:58:09,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1237/17840 [2:00:12<19:07:18, 4.15s/it]g-point operations will not be computed-18 10:58:09,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:14,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:12,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1238/17840 [2:00:15<17:47:20, 3.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:16,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1238/17840 [2:00:15<17:47:20, 3.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:16,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1239/17840 [2:00:18<16:26:48, 3.57s/it]g-point operations will not be computed-18 10:58:16,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1239/17840 [2:00:18<16:26:48, 3.57s/it]g-point operations will not be computed-18 10:58:16,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:20,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:18,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:20,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:18,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:22,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:21,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:24,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:23,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:24,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:23,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1242/17840 [2:00:25<12:28:08, 2.70s/it]g-point operations will not be computed-18 10:58:23,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1242/17840 [2:00:25<12:28:08, 2.70s/it]g-point operations will not be computed-18 10:58:23,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1242/17840 [2:00:25<12:28:08, 2.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:30,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1243/17840 [2:00:33<19:35:01, 4.25s/it]g-point operations will not be computed-18 10:58:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1243/17840 [2:00:33<19:35:01, 4.25s/it]g-point operations will not be computed-18 10:58:27,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1243/17840 [2:00:33<19:35:01, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:34,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1243/17840 [2:00:33<19:35:01, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:34,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:38,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:34,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [2:00:41<23:55:15, 5.19s/it]g-point operations will not be computed-18 10:58:34,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [2:00:41<23:55:15, 5.19s/it]g-point operations will not be computed-18 10:58:34,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [2:00:41<23:55:15, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [2:00:41<23:55:15, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [2:00:41<23:55:15, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:47,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:47,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:47,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:47,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:58:47,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:00:55<28:36:24, 6.21s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:00:55<28:36:24, 6.21s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [2:00:55<28:36:24, 6.21s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:01,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:01,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3852, 'learning_rate': 9.855106888361046e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:01,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:01,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:01,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [2:01:09<30:44:50, 6.67s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:12,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:12,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:12,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:01:16<31:11:45, 6.77s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:01:16<31:11:45, 6.77s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:01:16<31:11:45, 6.77s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:01:16<31:11:45, 6.77s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [2:01:16<31:11:45, 6.77s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:01:24<32:18:03, 7.01s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:01:24<32:18:03, 7.01s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:01:24<32:18:03, 7.01s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:01:24<32:18:03, 7.01s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [2:01:24<32:18:03, 7.01s/it]g-point operations will not be computed-18 10:58:42,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:01:31<32:24:12, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:01:31<32:24:12, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:01:31<32:24:12, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [2:01:31<32:24:12, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:01:38<32:27:05, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:01:38<32:27:05, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [2:01:38<32:27:05, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:44,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:44,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3583, 'learning_rate': 9.851543942992875e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:44,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:44,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:44,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:01:52<31:56:30, 6.93s/it]g-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [2:01:52<31:56:30, 6.93s/it]g-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:56,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 10:59:56,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [2:01:58<31:37:35, 6.86s/it]g-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [2:01:58<31:37:35, 6.86s/it]g-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [2:01:58<31:37:35, 6.86s/it]g-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:04,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:04,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8916, 'learning_rate': 9.849762470308789e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:04,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:04,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:04,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 10:59:32,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [2:02:12<31:22:00, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [2:02:12<31:22:00, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [2:02:12<31:22:00, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [2:02:12<31:22:00, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [2:02:18<31:09:54, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:21,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:21,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:02:25<31:01:31, 6.74s/it]g-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [2:02:25<31:01:31, 6.74s/it]g-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1184, 'learning_rate': 9.847980997624703e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:29,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [2:02:32<30:51:27, 6.70s/it]g-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [2:02:32<30:51:27, 6.70s/it]g-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2789, 'learning_rate': 9.847387173396675e-05, 'epoch': 1.41} + 7%|█████▏ | 1260/17840 [2:02:32<30:51:27, 6.70s/it]g-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:38,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:38,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3328, 'learning_rate': 9.846793349168647e-05, 'epoch': 1.41} +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:38,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:38,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:38,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:13,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:02:45<30:36:41, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:02:45<30:36:41, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:02:45<30:36:41, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [2:02:45<30:36:41, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [2:02:51<30:27:13, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:54,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:00:54,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [2:02:58<30:11:18, 6.56s/it]g-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [2:02:58<30:11:18, 6.56s/it]g-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.984, 'learning_rate': 9.845011876484561e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:02,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [2:03:04<29:48:00, 6.47s/it]g-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [2:03:04<29:48:00, 6.47s/it]g-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2353, 'learning_rate': 9.844418052256532e-05, 'epoch': 1.42} + 7%|█████▏ | 1265/17840 [2:03:04<29:48:00, 6.47s/it]g-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:10,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:10,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3328, 'learning_rate': 9.843824228028504e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:10,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:16,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:16,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9992, 'learning_rate': 9.843230403800476e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:16,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:22,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:22,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1601, 'learning_rate': 9.842636579572448e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:22,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:28,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:28,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2037, 'learning_rate': 9.842042755344418e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:28,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:35,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:35,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1816, 'learning_rate': 9.84144893111639e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:35,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:41,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:41,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0193, 'learning_rate': 9.840855106888361e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:41,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:47,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:47,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0829, 'learning_rate': 9.840261282660333e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:47,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:53,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:53,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:53,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.213, 'learning_rate': 9.839667458432305e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:53,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:59,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:59,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:59,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:01:59,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:05,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:05,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:05,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:05,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:11,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:11,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:16,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:16,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1277/17840 [2:04:18<27:31:00, 5.98s/it]g-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:20,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:20,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:20,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:00:46,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1278/17840 [2:04:23<26:49:41, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1278/17840 [2:04:23<26:49:41, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:28,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:28,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.262, 'learning_rate': 9.836104513064133e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:32,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:32,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1280/17840 [2:04:34<25:45:54, 5.60s/it]g-point operations will not be computed-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:36,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:36,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:36,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:24,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1281/17840 [2:04:39<25:16:46, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:42,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:42,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1282/17840 [2:04:44<24:36:24, 5.35s/it]g-point operations will not be computed-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:46,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:48,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:48,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2226, 'learning_rate': 9.833729216152019e-05, 'epoch': 1.44} +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:52,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:52,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:40,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1284/17840 [2:04:54<23:12:02, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:02:54,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:56,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:54,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:02:56,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:54,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1285/17840 [2:04:58<22:14:12, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:02:59,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:00,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:59,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:00,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:02:59,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1286/17840 [2:05:02<20:58:34, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:03:02,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:04,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:02,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:04,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:02,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1287/17840 [2:05:06<19:34:13, 4.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:03:06,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1288/17840 [2:05:09<18:15:23, 3.97s/it]g-point operations will not be computed-18 11:03:06,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1288/17840 [2:05:09<18:15:23, 3.97s/it]g-point operations will not be computed-18 11:03:06,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:10,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:09,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:10,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:09,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1289/17840 [2:05:12<16:53:04, 3.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:03:12,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1289/17840 [2:05:12<16:53:04, 3.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:03:12,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1290/17840 [2:05:15<15:27:03, 3.36s/it]g-point operations will not be computed-18 11:03:12,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1290/17840 [2:05:15<15:27:03, 3.36s/it]g-point operations will not be computed-18 11:03:12,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1291/17840 [2:05:17<14:00:53, 3.05s/it]g-point operations will not be computed-18 11:03:15,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1291/17840 [2:05:17<14:00:53, 3.05s/it]g-point operations will not be computed-18 11:03:15,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1292/17840 [2:05:19<12:35:53, 2.74s/it]g-point operations will not be computed-18 11:03:17,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1292/17840 [2:05:19<12:35:53, 2.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:03:20,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1292/17840 [2:05:19<12:35:53, 2.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:03:20,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:24,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:20,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:24,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:20,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [2:05:27<19:22:22, 4.21s/it]g-point operations will not be computed-18 11:03:20,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [2:05:27<19:22:22, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [2:05:27<19:22:22, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:31,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:31,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:05:34<23:48:55, 5.18s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:05:34<23:48:55, 5.18s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:05:34<23:48:55, 5.18s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [2:05:34<23:48:55, 5.18s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:41,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:41,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:41,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:41,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:41,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:05:49<28:41:35, 6.24s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:05:49<28:41:35, 6.24s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [2:05:49<28:41:35, 6.24s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:55,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:55,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1208, 'learning_rate': 9.82541567695962e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:55,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:55,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:03:55,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:06:03<30:55:23, 6.73s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:06:03<30:55:23, 6.73s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [2:06:03<30:55:23, 6.73s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1326, 'learning_rate': 9.824228028503563e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:06:18<32:20:58, 7.04s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:06:18<32:20:58, 7.04s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:06:18<32:20:58, 7.04s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:06:18<32:20:58, 7.04s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [2:06:18<32:20:58, 7.04s/it]g-point operations will not be computed-18 11:03:28,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:06:25<32:24:39, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:06:25<32:24:39, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:06:25<32:24:39, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [2:06:25<32:24:39, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1302/17840 [2:06:32<32:24:33, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1302/17840 [2:06:32<32:24:33, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1302/17840 [2:06:32<32:24:33, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:38,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:38,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3205, 'learning_rate': 9.82185273159145e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:38,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:38,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:38,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:26,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [2:06:46<32:01:36, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [2:06:46<32:01:36, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [2:06:46<32:01:36, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [2:06:46<32:01:36, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [2:06:52<31:43:29, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [2:06:52<31:43:29, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:04:57,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:06:59<31:35:34, 6.88s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:06:59<31:35:34, 6.88s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0093, 'learning_rate': 9.820071258907365e-05, 'epoch': 1.46} + 7%|█████▎ | 1306/17840 [2:06:59<31:35:34, 6.88s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:06:59<31:35:34, 6.88s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [2:06:59<31:35:34, 6.88s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1307/17840 [2:07:06<31:24:32, 6.84s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:08,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:08,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:08,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:07:13<31:14:46, 6.80s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1308/17840 [2:07:13<31:14:46, 6.80s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:17,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1309/17840 [2:07:19<30:56:38, 6.74s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1309/17840 [2:07:19<30:56:38, 6.74s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0986, 'learning_rate': 9.818289786223278e-05, 'epoch': 1.47} + 7%|█████▎ | 1309/17840 [2:07:19<30:56:38, 6.74s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:25,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:25,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2681, 'learning_rate': 9.81769596199525e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:25,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:25,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:25,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [2:07:32<30:25:15, 6.63s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:35,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:35,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:35,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:07:39<30:13:08, 6.58s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [2:07:39<30:13:08, 6.58s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:43,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:43,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:07:45<30:05:52, 6.56s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [2:07:45<30:05:52, 6.56s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:49,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:07:52<29:57:51, 6.53s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [2:07:52<29:57:51, 6.53s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9766, 'learning_rate': 9.815320665083137e-05, 'epoch': 1.47} + 7%|█████▍ | 1314/17840 [2:07:52<29:57:51, 6.53s/it]g-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:57,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:57,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.09, 'learning_rate': 9.814726840855108e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-18 11:05:57,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:04,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:04,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1104, 'learning_rate': 9.814133016627078e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:04,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:10,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:10,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4462, 'learning_rate': 9.81353919239905e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:10,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:10,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:10,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:04:46,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:08:17<29:11:51, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:18,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:08:17<29:11:51, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:18,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:08:17<29:11:51, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:18,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [2:08:17<29:11:51, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:18,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [2:08:23<28:52:16, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:24,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [2:08:23<28:52:16, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:24,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [2:08:23<28:52:16, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:24,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [2:08:23<28:52:16, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:24,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:08:29<28:35:43, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:30,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:08:29<28:35:43, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:30,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:08:29<28:35:43, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:30,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1320/17840 [2:08:29<28:35:43, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:30,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1321/17840 [2:08:35<28:29:07, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1321/17840 [2:08:35<28:29:07, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:41,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:41,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4387, 'learning_rate': 9.810570071258908e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:41,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:47,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:47,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2619, 'learning_rate': 9.80997624703088e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:47,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:53,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:53,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2634, 'learning_rate': 9.80938242280285e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:53,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:53,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:06:53,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:06:36,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:09:00<28:14:36, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [2:09:00<28:14:36, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:05,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:05,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1878, 'learning_rate': 9.808194774346795e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:05,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:10,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:10,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1933, 'learning_rate': 9.807600950118765e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:15,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1328/17840 [2:09:17<26:43:28, 5.83s/it]g-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1328/17840 [2:09:17<26:43:28, 5.83s/it]g-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:19,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:19,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:19,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:00,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1329/17840 [2:09:22<26:12:11, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:23,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:25,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:23,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1330/17840 [2:09:28<25:36:46, 5.58s/it]g-point operations will not be computed-18 11:07:23,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1330/17840 [2:09:28<25:36:46, 5.58s/it]g-point operations will not be computed-18 11:07:23,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:29,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:23,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:29,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:23,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1331/17840 [2:09:33<25:03:15, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1331/17840 [2:09:33<25:03:15, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:36,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:36,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1332/17840 [2:09:38<24:24:55, 5.32s/it]g-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:39,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:39,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:42,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:42,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:45,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:45,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:33,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1334/17840 [2:09:47<22:24:32, 4.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:47,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:49,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:47,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:49,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:47,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1335/17840 [2:09:51<21:12:46, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:51,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1335/17840 [2:09:51<21:12:46, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:51,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1336/17840 [2:09:54<19:57:09, 4.35s/it]g-point operations will not be computed-18 11:07:51,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1336/17840 [2:09:54<19:57:09, 4.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:55,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1336/17840 [2:09:54<19:57:09, 4.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:55,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1337/17840 [2:09:58<18:38:06, 4.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:07:58,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:58,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:07:59,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:07:58,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1338/17840 [2:10:01<17:16:45, 3.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:01,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1338/17840 [2:10:01<17:16:45, 3.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:01,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1339/17840 [2:10:04<15:59:25, 3.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:04,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1339/17840 [2:10:04<15:59:25, 3.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:04,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1340/17840 [2:10:06<14:35:19, 3.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:06,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1340/17840 [2:10:06<14:35:19, 3.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:06,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1341/17840 [2:10:08<13:15:39, 2.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:08,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1341/17840 [2:10:08<13:15:39, 2.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:08,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1342/17840 [2:10:10<11:54:39, 2.60s/it]g-point operations will not be computed-18 11:08:08,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1342/17840 [2:10:10<11:54:39, 2.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:12,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1342/17840 [2:10:10<11:54:39, 2.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:12,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:08:15,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:12,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:08:15,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:12,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1343/17840 [2:10:18<18:51:11, 4.11s/it]g-point operations will not be computed-18 11:08:12,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1343/17840 [2:10:18<18:51:11, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:19,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1343/17840 [2:10:18<18:51:11, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:19,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:08:23,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:19,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:08:23,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:19,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1344/17840 [2:10:25<23:22:05, 5.10s/it]g-point operations will not be computed-18 11:08:19,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▍ | 1344/17840 [2:10:25<23:22:05, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:08:30,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:08:30,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:10:33<26:26:33, 5.77s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:10:33<26:26:33, 5.77s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:10:33<26:26:33, 5.77s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:10:33<26:26:33, 5.77s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1345/17840 [2:10:33<26:26:33, 5.77s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1346/17840 [2:10:40<28:33:58, 6.23s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1346/17840 [2:10:40<28:33:58, 6.23s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:08:45,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:10:47<29:52:53, 6.52s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:10:47<29:52:53, 6.52s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0825, 'learning_rate': 9.795724465558195e-05, 'epoch': 1.51} + 8%|█████▌ | 1347/17840 [2:10:47<29:52:53, 6.52s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:10:47<29:52:53, 6.52s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [2:10:47<29:52:53, 6.52s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:10:54<30:44:04, 6.71s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [2:10:54<30:44:04, 6.71s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:08:59,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:11:02<31:22:25, 6.85s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:11:02<31:22:25, 6.85s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0921, 'learning_rate': 9.794536817102138e-05, 'epoch': 1.51} + 8%|█████▌ | 1349/17840 [2:11:02<31:22:25, 6.85s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:11:02<31:22:25, 6.85s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [2:11:02<31:22:25, 6.85s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:11:09<32:13:09, 7.03s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:11:09<32:13:09, 7.03s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [2:11:09<32:13:09, 7.03s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:15,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:15,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3422, 'learning_rate': 9.79334916864608e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:15,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:15,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:15,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:11:23<32:03:49, 7.00s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:11:23<32:03:49, 7.00s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:27,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1353/17840 [2:11:30<31:48:15, 6.94s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1353/17840 [2:11:30<31:48:15, 6.94s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2014, 'learning_rate': 9.792161520190025e-05, 'epoch': 1.52} + 8%|█████▌ | 1353/17840 [2:11:30<31:48:15, 6.94s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:36,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:36,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1206, 'learning_rate': 9.791567695961997e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:36,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:36,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:36,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:11:43<31:31:04, 6.88s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:11:43<31:31:04, 6.88s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:11:43<31:31:04, 6.88s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:49,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:49,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2814, 'learning_rate': 9.790380047505938e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:49,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:56,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:56,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2397, 'learning_rate': 9.78978622327791e-05, 'epoch': 1.52} +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:56,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:56,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:09:56,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:12:03<30:52:02, 6.74s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:06,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:06,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:06,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1359/17840 [2:12:10<30:39:34, 6.70s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1359/17840 [2:12:10<30:39:34, 6.70s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:14,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:12:17<30:28:59, 6.66s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:12:17<30:28:59, 6.66s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9265, 'learning_rate': 9.788004750593825e-05, 'epoch': 1.52} + 8%|█████▌ | 1360/17840 [2:12:17<30:28:59, 6.66s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:22,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:22,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.251, 'learning_rate': 9.787410926365797e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:22,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:29,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:29,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4268, 'learning_rate': 9.786817102137767e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:29,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:29,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:29,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:12:36<29:57:19, 6.54s/it]g-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:39,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:39,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:39,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:08:27,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:12:43<29:45:15, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:12:43<29:45:15, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:12:43<29:45:15, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1365/17840 [2:12:49<29:27:17, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1365/17840 [2:12:49<29:27:17, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:51,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:51,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:12:55<29:19:37, 6.41s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1366/17840 [2:12:55<29:19:37, 6.41s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2979, 'learning_rate': 9.784441805225654e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-18 11:10:59,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:13:01<29:06:57, 6.36s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:13:01<29:06:57, 6.36s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9388, 'learning_rate': 9.783847980997625e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:05,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:13:08<28:52:11, 6.31s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:13:08<28:52:11, 6.31s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2286, 'learning_rate': 9.783254156769597e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:11,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:13:14<28:39:12, 6.26s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:13:14<28:39:12, 6.26s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9412, 'learning_rate': 9.782660332541568e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:18,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1370/17840 [2:13:20<28:27:10, 6.22s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1370/17840 [2:13:20<28:27:10, 6.22s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9699, 'learning_rate': 9.78206650831354e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:24,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1371/17840 [2:13:26<28:19:54, 6.19s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1371/17840 [2:13:26<28:19:54, 6.19s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1272, 'learning_rate': 9.78147268408551e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:30,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1372/17840 [2:13:32<27:59:29, 6.12s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1372/17840 [2:13:32<27:59:29, 6.12s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:34,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:34,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1373/17840 [2:13:38<27:45:36, 6.07s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1373/17840 [2:13:38<27:45:36, 6.07s/it]g-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:40,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:40,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:40,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:10:43,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1374/17840 [2:13:44<27:27:16, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:11:45,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1374/17840 [2:13:44<27:27:16, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:11:45,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1374/17840 [2:13:44<27:27:16, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:11:45,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:13:50<27:39:45, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:11:45,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:13:50<27:39:45, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:11:45,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:52,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:45,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:52,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:45,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:11:52,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:45,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1376/17840 [2:13:56<27:05:59, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1376/17840 [2:13:56<27:05:59, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:00,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:00,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9311, 'learning_rate': 9.77790973871734e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:04,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:14:07<26:07:35, 5.71s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1378/17840 [2:14:07<26:07:35, 5.71s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:09,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:11,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:11,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:11,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:15,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:15,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1380/17840 [2:14:17<25:11:39, 5.51s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:19,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:22,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:22,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9434, 'learning_rate': 9.775534441805227e-05, 'epoch': 1.55} +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:25,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1382/17840 [2:14:27<23:57:18, 5.24s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1382/17840 [2:14:27<23:57:18, 5.24s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:29,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:31,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:31,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:33,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:33,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:35,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:37,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:37,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:39,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:41,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:41,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:43,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:46,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:46,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2997, 'learning_rate': 9.771971496437055e-05, 'epoch': 1.55} +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:49,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:51,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:51,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:53,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:53,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:56,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:56,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:58,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:58,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:59,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:12:59,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:03,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:03,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:03,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:06,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:06,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:10,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:10,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:14,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:14,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:18,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:18,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:18,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:15:22<26:28:02, 5.79s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:15:22<26:28:02, 5.79s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:15:22<26:28:02, 5.79s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:15:22<26:28:02, 5.79s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1395/17840 [2:15:22<26:28:02, 5.79s/it]g-point operations will not be computed-18 11:11:56,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:15:29<28:34:56, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:15:29<28:34:56, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:15:29<28:34:56, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1396/17840 [2:15:29<28:34:56, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:15:37<29:53:44, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:15:37<29:53:44, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:15:37<29:53:44, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:15:37<29:53:44, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:15:37<29:53:44, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:15:44<30:46:27, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:47,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:47,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:47,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:15:51<31:22:55, 6.87s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:15:51<31:22:55, 6.87s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:15:51<31:22:55, 6.87s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:58,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:13:58,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3197, 'learning_rate': 9.764251781472685e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:01,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:01,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:01,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1401/17840 [2:16:06<32:15:58, 7.07s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1401/17840 [2:16:06<32:15:58, 7.07s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1401/17840 [2:16:06<32:15:58, 7.07s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:12,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:12,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7274, 'learning_rate': 9.763064133016627e-05, 'epoch': 1.57} +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:12,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:12,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:12,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:16:19<31:44:07, 6.95s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:16:19<31:44:07, 6.95s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:24,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1404/17840 [2:16:26<31:33:54, 6.91s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1404/17840 [2:16:26<31:33:54, 6.91s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.621, 'learning_rate': 9.76187648456057e-05, 'epoch': 1.57} + 8%|█████▋ | 1404/17840 [2:16:26<31:33:54, 6.91s/it]g-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:32,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:32,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0283, 'learning_rate': 9.761282660332542e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:32,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:32,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:32,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:13:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:16:40<31:12:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:16:40<31:12:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:16:40<31:12:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:16:46<31:04:31, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:16:46<31:04:31, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0553, 'learning_rate': 9.760095011876486e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:51,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:16:53<30:52:49, 6.77s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:16:53<30:52:49, 6.77s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0956, 'learning_rate': 9.759501187648457e-05, 'epoch': 1.58} + 8%|█████▊ | 1408/17840 [2:16:53<30:52:49, 6.77s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:59,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:59,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0423, 'learning_rate': 9.758907363420427e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:59,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:59,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:14:59,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1410/17840 [2:17:06<30:31:15, 6.69s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:09,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:09,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:17:13<30:21:43, 6.65s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:17:13<30:21:43, 6.65s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.324, 'learning_rate': 9.75771971496437e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:17,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:17:19<30:12:52, 6.62s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:17:19<30:12:52, 6.62s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2402, 'learning_rate': 9.757125890736342e-05, 'epoch': 1.58} + 8%|█████▊ | 1412/17840 [2:17:19<30:12:52, 6.62s/it]g-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:25,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:25,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1274, 'learning_rate': 9.756532066508314e-05, 'epoch': 1.58} +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:25,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:25,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:25,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:14:41,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:17:32<29:53:13, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:33,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:17:32<29:53:13, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:33,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:17:32<29:53:13, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:33,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:17:32<29:53:13, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:33,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1415/17840 [2:17:39<29:38:40, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1415/17840 [2:17:39<29:38:40, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1415/17840 [2:17:39<29:38:40, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1415/17840 [2:17:39<29:38:40, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:17:45<29:23:48, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:47,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:47,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1417/17840 [2:17:51<29:16:07, 6.42s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1417/17840 [2:17:51<29:16:07, 6.42s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:54,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:15:54,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:17:58<29:08:13, 6.39s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1418/17840 [2:17:58<29:08:13, 6.39s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.818, 'learning_rate': 9.75356294536817e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:02,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:18:04<29:01:26, 6.36s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:18:04<29:01:26, 6.36s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1751, 'learning_rate': 9.752969121140144e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:08,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1420/17840 [2:18:10<28:46:19, 6.31s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1420/17840 [2:18:10<28:46:19, 6.31s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2369, 'learning_rate': 9.752375296912114e-05, 'epoch': 1.59} + 8%|█████▊ | 1420/17840 [2:18:10<28:46:19, 6.31s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:15,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:15,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1609, 'learning_rate': 9.751781472684086e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:15,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:22,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:22,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2007, 'learning_rate': 9.751187648456057e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:22,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:28,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:28,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.074, 'learning_rate': 9.750593824228029e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:32,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:18:34<27:53:39, 6.12s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:18:34<27:53:39, 6.12s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:37,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:37,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1425/17840 [2:18:41<28:14:37, 6.19s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1425/17840 [2:18:41<28:14:37, 6.19s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0046, 'learning_rate': 9.749406175771972e-05, 'epoch': 1.6} + 8%|█████▊ | 1425/17840 [2:18:41<28:14:37, 6.19s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:46,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:46,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0189, 'learning_rate': 9.748812351543944e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:50,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:50,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1427/17840 [2:18:52<27:18:28, 5.99s/it]g-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:54,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:54,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:16:54,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:15:39,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:18:58<26:43:09, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:18:58<26:43:09, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:03,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:03,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0465, 'learning_rate': 9.747030878859857e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:07,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1430/17840 [2:19:09<25:35:18, 5.61s/it]g-point operations will not be computed-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1430/17840 [2:19:09<25:35:18, 5.61s/it]g-point operations will not be computed-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:11,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:11,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:11,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:16:59,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1431/17840 [2:19:14<25:01:42, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:17,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1432/17840 [2:19:19<24:26:12, 5.36s/it]g-point operations will not be computed-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1432/17840 [2:19:19<24:26:12, 5.36s/it]g-point operations will not be computed-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:21,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:23,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:23,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3779, 'learning_rate': 9.744655581947744e-05, 'epoch': 1.61} +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:26,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:26,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:14,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1434/17840 [2:19:28<22:33:25, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:29,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:31,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:29,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:31,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:29,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1435/17840 [2:19:32<21:27:33, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:33,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1436/17840 [2:19:36<20:13:12, 4.44s/it]g-point operations will not be computed-18 11:17:33,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1436/17840 [2:19:36<20:13:12, 4.44s/it]g-point operations will not be computed-18 11:17:33,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1436/17840 [2:19:36<20:13:12, 4.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:36,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1437/17840 [2:19:40<18:51:38, 4.14s/it]g-point operations will not be computed-18 11:17:36,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1437/17840 [2:19:40<18:51:38, 4.14s/it]g-point operations will not be computed-18 11:17:36,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:41,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:40,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:41,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:40,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1438/17840 [2:19:43<17:21:32, 3.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:43,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1439/17840 [2:19:45<15:57:35, 3.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:45,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1439/17840 [2:19:45<15:57:35, 3.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:45,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1440/17840 [2:19:48<14:33:56, 3.20s/it]g-point operations will not be computed-18 11:17:45,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1440/17840 [2:19:48<14:33:56, 3.20s/it]g-point operations will not be computed-18 11:17:45,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1441/17840 [2:19:50<13:11:54, 2.90s/it]g-point operations will not be computed-18 11:17:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1441/17840 [2:19:50<13:11:54, 2.90s/it]g-point operations will not be computed-18 11:17:48,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:19:52<11:52:55, 2.61s/it]g-point operations will not be computed-18 11:17:50,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:19:52<11:52:55, 2.61s/it]g-point operations will not be computed-18 11:17:50,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:19:52<11:52:55, 2.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:53,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:19:52<11:52:55, 2.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:17:53,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:17:57,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:17:53,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:20:00<18:42:21, 4.11s/it]g-point operations will not be computed-18 11:17:53,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:20:00<18:42:21, 4.11s/it]g-point operations will not be computed-18 11:17:53,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:20:00<18:42:21, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:18:01,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:20:00<18:42:21, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:18:01,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:18:04,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:01,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:18:04,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:01,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:20:07<23:14:20, 5.10s/it]g-point operations will not be computed-18 11:18:01,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:20:07<23:14:20, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:18:12,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:20:14<26:12:37, 5.76s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:20:14<26:12:37, 5.76s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1657, 'learning_rate': 9.737529691211402e-05, 'epoch': 1.62} + 8%|█████▉ | 1445/17840 [2:20:14<26:12:37, 5.76s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:20:14<26:12:37, 5.76s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:20:14<26:12:37, 5.76s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:20:21<28:09:11, 6.18s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:20:21<28:09:11, 6.18s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:18:26,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:20:29<29:26:10, 6.46s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:20:29<29:26:10, 6.46s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9176, 'learning_rate': 9.736342042755346e-05, 'epoch': 1.62} + 8%|█████▉ | 1447/17840 [2:20:29<29:26:10, 6.46s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:20:29<29:26:10, 6.46s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:20:29<29:26:10, 6.46s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:20:36<30:12:59, 6.64s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:18:38,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:18:38,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:20:43<30:43:10, 6.75s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:20:43<30:43:10, 6.75s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0125, 'learning_rate': 9.735154394299287e-05, 'epoch': 1.62} + 8%|█████▉ | 1449/17840 [2:20:43<30:43:10, 6.75s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:20:43<30:43:10, 6.75s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:20:50<31:45:10, 6.97s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:20:50<31:45:10, 6.97s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0736, 'learning_rate': 9.734560570071259e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-18 11:18:55,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:20:57<31:52:02, 7.00s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:20:57<31:52:02, 7.00s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5562, 'learning_rate': 9.73396674584323e-05, 'epoch': 1.63} + 8%|█████▉ | 1451/17840 [2:20:57<31:52:02, 7.00s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:20:57<31:52:02, 7.00s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:20:57<31:52:02, 7.00s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1452/17840 [2:21:04<31:46:18, 6.98s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:07,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:07,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:21:11<31:41:05, 6.96s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:21:11<31:41:05, 6.96s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2716, 'learning_rate': 9.732779097387174e-05, 'epoch': 1.63} + 8%|█████▉ | 1453/17840 [2:21:11<31:41:05, 6.96s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:17,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:17,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9757, 'learning_rate': 9.732185273159146e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:17,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:17,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:21:25<31:14:36, 6.86s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:21:25<31:14:36, 6.86s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:27,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:27,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1456/17840 [2:21:31<31:05:55, 6.83s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1456/17840 [2:21:31<31:05:55, 6.83s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0642, 'learning_rate': 9.730997624703089e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:36,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1457/17840 [2:21:38<30:56:29, 6.80s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1457/17840 [2:21:38<30:56:29, 6.80s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8991, 'learning_rate': 9.73040380047506e-05, 'epoch': 1.63} + 8%|█████▉ | 1457/17840 [2:21:38<30:56:29, 6.80s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:44,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:44,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:44,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8158, 'learning_rate': 9.729809976247031e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:44,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:21:51<30:39:43, 6.74s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:21:51<30:39:43, 6.74s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:54,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:54,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:19:54,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:21:58<30:32:41, 6.71s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:21:58<30:32:41, 6.71s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:21:58<30:32:41, 6.71s/it]g-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:04,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:04,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.851, 'learning_rate': 9.728028503562946e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:04,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:04,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:04,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:18:08,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:22:11<30:12:11, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:22:11<30:12:11, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:22:11<30:12:11, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:22:11<30:12:11, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1463/17840 [2:22:18<29:51:21, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:20,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:20,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:20,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:22:24<29:36:58, 6.51s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:26,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:26,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:26,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:22:30<29:26:54, 6.47s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:22:30<29:26:54, 6.47s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:34,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:34,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:22:37<29:12:12, 6.42s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1466/17840 [2:22:37<29:12:12, 6.42s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:41,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:41,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:22:43<29:03:53, 6.39s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:22:43<29:03:53, 6.39s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:47,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:22:49<28:48:36, 6.33s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:22:49<28:48:36, 6.33s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:53,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:53,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:22:55<28:38:26, 6.30s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:22:55<28:38:26, 6.30s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:59,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:20:59,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1470/17840 [2:23:02<28:27:53, 6.26s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1470/17840 [2:23:02<28:27:53, 6.26s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:05,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:05,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1471/17840 [2:23:08<28:08:58, 6.19s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1471/17840 [2:23:08<28:08:58, 6.19s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:11,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:11,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1472/17840 [2:23:14<27:53:04, 6.13s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1472/17840 [2:23:14<27:53:04, 6.13s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:17,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:17,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:23:20<27:40:09, 6.09s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:23:20<27:40:09, 6.09s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:23,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:23,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1474/17840 [2:23:25<27:22:30, 6.02s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:28,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:28,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:28,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:23:32<27:45:38, 6.11s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:34,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:34,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:34,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1476/17840 [2:23:38<27:14:31, 5.99s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:40,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:42,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:42,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2602, 'learning_rate': 9.718527315914489e-05, 'epoch': 1.66} +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:46,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:46,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1478/17840 [2:23:48<26:00:15, 5.72s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1478/17840 [2:23:48<26:00:15, 5.72s/it]g-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:52,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:20:12,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1479/17840 [2:23:54<25:26:24, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:21:54,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1479/17840 [2:23:54<25:26:24, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:21:54,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:58,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:21:54,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:21:58,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:21:54,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:01,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:21:54,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:01,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:21:54,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:01,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:21:54,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1481/17840 [2:24:04<24:18:33, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1481/17840 [2:24:04<24:18:33, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:08,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:08,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:10,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:13,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:13,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9644, 'learning_rate': 9.714964370546319e-05, 'epoch': 1.66} +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:16,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:16,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:05,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1484/17840 [2:24:18<22:05:02, 4.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:18,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:20,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:18,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:20,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:18,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1485/17840 [2:24:22<21:03:43, 4.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:22,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1486/17840 [2:24:26<19:55:16, 4.39s/it]g-point operations will not be computed-18 11:22:22,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1486/17840 [2:24:26<19:55:16, 4.39s/it]g-point operations will not be computed-18 11:22:22,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1486/17840 [2:24:26<19:55:16, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:26,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1487/17840 [2:24:29<18:42:49, 4.12s/it]g-point operations will not be computed-18 11:22:26,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1487/17840 [2:24:29<18:42:49, 4.12s/it]g-point operations will not be computed-18 11:22:26,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1487/17840 [2:24:29<18:42:49, 4.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:29,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1487/17840 [2:24:29<18:42:49, 4.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:29,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1488/17840 [2:24:33<17:31:07, 3.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:33,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1489/17840 [2:24:35<16:08:26, 3.55s/it]g-point operations will not be computed-18 11:22:33,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1489/17840 [2:24:35<16:08:26, 3.55s/it]g-point operations will not be computed-18 11:22:33,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:37,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:35,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:37,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:35,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:39,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:38,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:39,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:38,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:41,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:40,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:41,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:40,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1492/17840 [2:24:42<11:57:10, 2.63s/it]g-point operations will not be computed-18 11:22:40,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1492/17840 [2:24:42<11:57:10, 2.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:43,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:47,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:43,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1493/17840 [2:24:50<18:41:15, 4.12s/it]g-point operations will not be computed-18 11:22:43,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1493/17840 [2:24:50<18:41:15, 4.12s/it]g-point operations will not be computed-18 11:22:43,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1493/17840 [2:24:50<18:41:15, 4.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:51,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1493/17840 [2:24:50<18:41:15, 4.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:51,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:54,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:51,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:22:54,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:51,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:24:57<23:05:45, 5.09s/it]g-point operations will not be computed-18 11:22:51,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:24:57<23:05:45, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:24:57<23:05:45, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:24:57<23:05:45, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:24:57<23:05:45, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:25:04<26:15:40, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:07,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:07,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:25:12<28:03:20, 6.18s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:25:12<28:03:20, 6.18s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.982, 'learning_rate': 9.707244655581948e-05, 'epoch': 1.68} + 8%|██████ | 1496/17840 [2:25:12<28:03:20, 6.18s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:18,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:18,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0392, 'learning_rate': 9.706650831353919e-05, 'epoch': 1.68} +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:18,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:18,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█���████▏ | 1498/17840 [2:25:26<30:16:02, 6.67s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:25:26<30:16:02, 6.67s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1327, 'learning_rate': 9.706057007125891e-05, 'epoch': 1.68} +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:30,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:25:33<30:54:39, 6.81s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:25:33<30:54:39, 6.81s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0443, 'learning_rate': 9.705463182897863e-05, 'epoch': 1.68} + 8%|██████▏ | 1499/17840 [2:25:33<30:54:39, 6.81s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:25:33<30:54:39, 6.81s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1500/17840 [2:25:41<31:55:16, 7.03s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1500/17840 [2:25:41<31:55:16, 7.03s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9834, 'learning_rate': 9.704869358669835e-05, 'epoch': 1.68} + 8%|██████▏ | 1500/17840 [2:25:41<31:55:16, 7.03s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1500/17840 [2:25:41<31:55:16, 7.03s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1500/17840 [2:25:41<31:55:16, 7.03s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1501/17840 [2:25:48<31:52:48, 7.02s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:50,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:50,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1502/17840 [2:25:54<31:37:25, 6.97s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1502/17840 [2:25:54<31:37:25, 6.97s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2999, 'learning_rate': 9.703681710213777e-05, 'epoch': 1.68} +[WARNING|modeling_utils.py:388] 2022-03-18 11:23:59,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1503/17840 [2:26:01<31:27:21, 6.93s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1503/17840 [2:26:01<31:27:21, 6.93s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1083, 'learning_rate': 9.703087885985749e-05, 'epoch': 1.68} + 8%|██████▏ | 1503/17840 [2:26:01<31:27:21, 6.93s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:07,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:07,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:07,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0787, 'learning_rate': 9.702494061757719e-05, 'epoch': 1.69} +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:07,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:26:15<31:06:10, 6.85s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1505/17840 [2:26:15<31:06:10, 6.85s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:17,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:17,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1506/17840 [2:26:22<30:53:28, 6.81s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1506/17840 [2:26:22<30:53:28, 6.81s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.974, 'learning_rate': 9.701306413301663e-05, 'epoch': 1.69} + 8%|██████▏ | 1506/17840 [2:26:22<30:53:28, 6.81s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:27,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:27,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1478, 'learning_rate': 9.700712589073635e-05, 'epoch': 1.69} +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:27,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:27,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1508/17840 [2:26:35<30:24:10, 6.70s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1508/17840 [2:26:35<30:24:10, 6.70s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:37,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:37,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1509/17840 [2:26:41<30:18:50, 6.68s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1509/17840 [2:26:41<30:18:50, 6.68s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:44,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:44,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:44,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1510/17840 [2:26:48<30:08:09, 6.64s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1510/17840 [2:26:48<30:08:09, 6.64s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:52,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:52,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:26:54<29:56:51, 6.60s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1511/17840 [2:26:54<29:56:51, 6.60s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:24:59,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1512/17840 [2:27:01<29:46:46, 6.57s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1512/17840 [2:27:01<29:46:46, 6.57s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9289, 'learning_rate': 9.697743467933492e-05, 'epoch': 1.7} + 8%|██████▏ | 1512/17840 [2:27:01<29:46:46, 6.57s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:07,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:07,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1631, 'learning_rate': 9.697149643705464e-05, 'epoch': 1.7} +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:07,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:07,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:07,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1514/17840 [2:27:14<29:27:12, 6.49s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:16,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:16,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:16,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1515/17840 [2:27:20<29:24:05, 6.48s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:23,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:23,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:23,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1516/17840 [2:27:27<29:09:12, 6.43s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1516/17840 [2:27:27<29:09:12, 6.43s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:30,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:30,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1517/17840 [2:27:33<28:56:27, 6.38s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:35,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:35,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:35,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1518/17840 [2:27:39<28:37:28, 6.31s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:41,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:41,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:41,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1519/17840 [2:27:45<28:23:26, 6.26s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:47,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:47,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:47,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1520/17840 [2:27:51<28:13:42, 6.23s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1520/17840 [2:27:51<28:13:42, 6.23s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:55,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:25:55,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1521/17840 [2:27:57<28:00:43, 6.18s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:00,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:00,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:00,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1522/17840 [2:28:03<27:49:02, 6.14s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:06,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:06,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:06,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1523/17840 [2:28:09<27:31:56, 6.07s/it]g-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:12,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:12,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:12,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:22:58,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1524/17840 [2:28:15<27:19:43, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:16,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1524/17840 [2:28:15<27:19:43, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:16,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1524/17840 [2:28:15<27:19:43, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:16,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1525/17840 [2:28:22<27:47:01, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:16,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1525/17840 [2:28:22<27:47:01, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:16,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:24,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:16,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:24,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:16,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:24,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:16,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1526/17840 [2:28:27<27:14:07, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▏ | 1526/17840 [2:28:27<27:14:07, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:32,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:32,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2105, 'learning_rate': 9.688836104513065e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:32,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:38,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:38,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:40,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:40,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:28,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1529/17840 [2:28:44<25:43:52, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:45,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1529/17840 [2:28:44<25:43:52, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:45,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0766, 'learning_rate': 9.687648456057008e-05, 'epoch': 1.71} +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:48,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:45,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:48,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:45,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3179, 'learning_rate': 9.687054631828979e-05, 'epoch': 1.72} +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:52,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:45,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1531/17840 [2:28:54<24:32:43, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1531/17840 [2:28:54<24:32:43, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1029, 'learning_rate': 9.686460807600951e-05, 'epoch': 1.72} +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:58,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:26:58,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:01,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:03,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:03,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0386, 'learning_rate': 9.685273159144893e-05, 'epoch': 1.72} +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:06,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:06,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:26:55,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1534/17840 [2:29:08<22:08:31, 4.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:09,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:11,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:09,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:11,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:09,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1535/17840 [2:29:12<20:59:04, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:13,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1536/17840 [2:29:16<19:49:53, 4.38s/it]g-point operations will not be computed-18 11:27:13,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1536/17840 [2:29:16<19:49:53, 4.38s/it]g-point operations will not be computed-18 11:27:13,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1536/17840 [2:29:16<19:49:53, 4.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:16,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1537/17840 [2:29:20<18:36:50, 4.11s/it]g-point operations will not be computed-18 11:27:16,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1537/17840 [2:29:20<18:36:50, 4.11s/it]g-point operations will not be computed-18 11:27:16,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:21,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:20,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1538/17840 [2:29:23<17:13:48, 3.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:23,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1538/17840 [2:29:23<17:13:48, 3.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:23,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1539/17840 [2:29:25<15:52:12, 3.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:25,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1539/17840 [2:29:25<15:52:12, 3.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:25,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1540/17840 [2:29:28<14:31:25, 3.21s/it]g-point operations will not be computed-18 11:27:25,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1540/17840 [2:29:28<14:31:25, 3.21s/it]g-point operations will not be computed-18 11:27:25,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1541/17840 [2:29:30<13:10:03, 2.91s/it]g-point operations will not be computed-18 11:27:28,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1541/17840 [2:29:30<13:10:03, 2.91s/it]g-point operations will not be computed-18 11:27:28,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1542/17840 [2:29:32<11:51:37, 2.62s/it]g-point operations will not be computed-18 11:27:30,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1542/17840 [2:29:32<11:51:37, 2.62s/it]g-point operations will not be computed-18 11:27:30,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1542/17840 [2:29:32<11:51:37, 2.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:33,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1542/17840 [2:29:32<11:51:37, 2.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:33,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:37,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:33,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1543/17840 [2:29:40<18:42:53, 4.13s/it]g-point operations will not be computed-18 11:27:33,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1543/17840 [2:29:40<18:42:53, 4.13s/it]g-point operations will not be computed-18 11:27:33,864 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1543/17840 [2:29:40<18:42:53, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1543/17840 [2:29:40<18:42:53, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:45,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:29:47<23:18:27, 5.15s/it]g-point operations will not be computed-18 11:27:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:29:47<23:18:27, 5.15s/it]g-point operations will not be computed-18 11:27:41,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:29:47<23:18:27, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1544/17840 [2:29:47<23:18:27, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:54,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:54,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4348, 'learning_rate': 9.678147268408551e-05, 'epoch': 1.73} +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:54,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:27:54,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1546/17840 [2:30:02<28:12:39, 6.23s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1546/17840 [2:30:02<28:12:39, 6.23s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0984, 'learning_rate': 9.677553444180523e-05, 'epoch': 1.73} + 9%|██████▎ | 1546/17840 [2:30:02<28:12:39, 6.23s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1546/17840 [2:30:02<28:12:39, 6.23s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:30:09<29:31:38, 6.52s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1547/17840 [2:30:09<29:31:38, 6.52s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:12,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:12,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1548/17840 [2:30:16<30:18:06, 6.70s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1548/17840 [2:30:16<30:18:06, 6.70s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0009, 'learning_rate': 9.676365795724466e-05, 'epoch': 1.74} + 9%|██████▎ | 1548/17840 [2:30:16<30:18:06, 6.70s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:22,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:22,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.426, 'learning_rate': 9.675771971496438e-05, 'epoch': 1.74} +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:22,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:22,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:30:31<31:44:51, 7.02s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:30:31<31:44:51, 7.02s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1106, 'learning_rate': 9.675178147268409e-05, 'epoch': 1.74} + 9%|██████▎ | 1550/17840 [2:30:31<31:44:51, 7.02s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:30:31<31:44:51, 7.02s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1550/17840 [2:30:31<31:44:51, 7.02s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1551/17840 [2:30:38<31:45:38, 7.02s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:40,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:40,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:40,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:30:45<31:43:33, 7.01s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:30:45<31:43:33, 7.01s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1552/17840 [2:30:45<31:43:33, 7.01s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:51,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:51,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2297, 'learning_rate': 9.673396674584323e-05, 'epoch': 1.74} +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:51,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:51,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:28:51,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1554/17840 [2:30:58<31:18:41, 6.92s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:01,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:01,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:01,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1555/17840 [2:31:05<31:10:31, 6.89s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1555/17840 [2:31:05<31:10:31, 6.89s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1555/17840 [2:31:05<31:10:31, 6.89s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:11,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:11,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0144, 'learning_rate': 9.671615201900238e-05, 'epoch': 1.74} +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:11,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:11,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:11,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▎ | 1557/17840 [2:31:19<30:43:59, 6.79s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:21,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:21,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:21,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1558/17840 [2:31:25<30:32:54, 6.75s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1558/17840 [2:31:25<30:32:54, 6.75s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:29,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:29,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1559/17840 [2:31:32<30:17:16, 6.70s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1559/17840 [2:31:32<30:17:16, 6.70s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1559/17840 [2:31:32<30:17:16, 6.70s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:38,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:38,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2919, 'learning_rate': 9.669239904988125e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:38,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:38,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:38,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1561/17840 [2:31:45<30:06:02, 6.66s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:48,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:48,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:48,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1562/17840 [2:31:52<29:55:16, 6.62s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:54,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:54,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:29:54,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1563/17840 [2:31:58<29:45:18, 6.58s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1563/17840 [2:31:58<29:45:18, 6.58s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:02,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1564/17840 [2:32:05<29:32:36, 6.53s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1564/17840 [2:32:05<29:32:36, 6.53s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1985, 'learning_rate': 9.666864608076009e-05, 'epoch': 1.75} + 9%|██████▍ | 1564/17840 [2:32:05<29:32:36, 6.53s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:10,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:10,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8319, 'learning_rate': 9.666270783847981e-05, 'epoch': 1.75} +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:15,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1566/17840 [2:32:17<29:09:45, 6.45s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1566/17840 [2:32:17<29:09:45, 6.45s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3295, 'learning_rate': 9.665676959619953e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:21,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1567/17840 [2:32:24<28:55:33, 6.40s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1567/17840 [2:32:24<28:55:33, 6.40s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2935, 'learning_rate': 9.665083135391925e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:28,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1568/17840 [2:32:30<28:44:11, 6.36s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1568/17840 [2:32:30<28:44:11, 6.36s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0292, 'learning_rate': 9.664489311163896e-05, 'epoch': 1.76} + 9%|██████▍ | 1568/17840 [2:32:30<28:44:11, 6.36s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:35,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:35,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9882, 'learning_rate': 9.663895486935868e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:35,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:41,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:41,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1792, 'learning_rate': 9.663301662707838e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:41,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:47,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:47,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9765, 'learning_rate': 9.66270783847981e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:47,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:54,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:54,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0755, 'learning_rate': 9.662114014251783e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-18 11:30:58,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1573/17840 [2:33:00<27:38:43, 6.12s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1573/17840 [2:33:00<27:38:43, 6.12s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2607, 'learning_rate': 9.661520190023755e-05, 'epoch': 1.76} + 9%|██████▍ | 1573/17840 [2:33:00<27:38:43, 6.12s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:06,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:06,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8543, 'learning_rate': 9.660926365795725e-05, 'epoch': 1.76} +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:10,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1575/17840 [2:33:13<27:50:41, 6.16s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1575/17840 [2:33:13<27:50:41, 6.16s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9633, 'learning_rate': 9.660332541567696e-05, 'epoch': 1.77} +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:16,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1576/17840 [2:33:18<27:20:22, 6.05s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1576/17840 [2:33:18<27:20:22, 6.05s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2479, 'learning_rate': 9.659738717339668e-05, 'epoch': 1.77} +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:22,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:22,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1577/17840 [2:33:24<26:45:17, 5.92s/it]g-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:26,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:26,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:26,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:27:48,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1578/17840 [2:33:30<26:12:21, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1578/17840 [2:33:30<26:12:21, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:34,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:34,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9595, 'learning_rate': 9.657957244655583e-05, 'epoch': 1.77} +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:38,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:38,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1580/17840 [2:33:40<25:04:53, 5.55s/it]g-point operations will not be computed-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:42,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:42,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:42,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:30,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1581/17840 [2:33:45<24:32:30, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:48,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:48,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▍ | 1582/17840 [2:33:50<23:51:29, 5.28s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:52,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:52,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:54,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:56,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:56,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:31:59,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:01,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:01,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:03,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:05,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:05,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:07,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:08,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:10,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:10,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:12,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:16,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:16,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4343, 'learning_rate': 9.652019002375298e-05, 'epoch': 1.78} +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:19,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:19,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:21,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:21,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:23,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:23,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:27,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:27,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:27,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:30,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:30,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:34,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:34,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:34,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:38,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:38,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:38,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:45,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:45,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0415, 'learning_rate': 9.648456057007126e-05, 'epoch': 1.79} +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:45,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:45,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:32:45,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:34:53<28:02:43, 6.22s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:34:53<28:02:43, 6.22s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:34:53<28:02:43, 6.22s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:34:53<28:02:43, 6.22s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1596/17840 [2:34:53<28:02:43, 6.22s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1597/17840 [2:35:00<29:23:03, 6.51s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:03,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:03,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:03,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1598/17840 [2:35:08<30:15:58, 6.71s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1598/17840 [2:35:08<30:15:58, 6.71s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1598/17840 [2:35:08<30:15:58, 6.71s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:14,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:14,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1058, 'learning_rate': 9.646080760095013e-05, 'epoch': 1.79} +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:14,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:14,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:35:23<32:01:39, 7.10s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:35:23<32:01:39, 7.10s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3186, 'learning_rate': 9.645486935866985e-05, 'epoch': 1.79} + 9%|██████▌ | 1600/17840 [2:35:23<32:01:39, 7.10s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:35:23<32:01:39, 7.10s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1600/17840 [2:35:23<32:01:39, 7.10s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:35:30<31:59:53, 7.09s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:35:30<31:59:53, 7.09s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:35:30<31:59:53, 7.09s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1601/17840 [2:35:30<31:59:53, 7.09s/it]g-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:36,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:36,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:36,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:36,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:36,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:31:46,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1603/17840 [2:35:43<31:41:35, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1603/17840 [2:35:43<31:41:35, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1603/17840 [2:35:43<31:41:35, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1603/17840 [2:35:43<31:41:35, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1604/17840 [2:35:50<31:28:54, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1604/17840 [2:35:50<31:28:54, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1604/17840 [2:35:50<31:28:54, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:56,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:56,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3885, 'learning_rate': 9.642517814726841e-05, 'epoch': 1.8} +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:56,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:56,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:33:56,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1606/17840 [2:36:04<31:08:37, 6.91s/it]g-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:07,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:07,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:07,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1607/17840 [2:36:11<30:51:15, 6.84s/it]g-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1607/17840 [2:36:11<30:51:15, 6.84s/it]g-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1607/17840 [2:36:11<30:51:15, 6.84s/it]g-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:17,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:17,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0232, 'learning_rate': 9.640736342042755e-05, 'epoch': 1.8} +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:17,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:17,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:17,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:33:44,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1609/17840 [2:36:24<30:31:38, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1609/17840 [2:36:24<30:31:38, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1609/17840 [2:36:24<30:31:38, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1609/17840 [2:36:24<30:31:38, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1610/17840 [2:36:31<30:20:59, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1610/17840 [2:36:31<30:20:59, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:35,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:35,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1611/17840 [2:36:37<30:11:13, 6.70s/it]g-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1611/17840 [2:36:37<30:11:13, 6.70s/it]g-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1611/17840 [2:36:37<30:11:13, 6.70s/it]g-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:43,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:43,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.278, 'learning_rate': 9.638361045130642e-05, 'epoch': 1.81} +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:43,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:43,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:34:43,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:25,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1613/17840 [2:36:51<29:54:10, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1613/17840 [2:36:51<29:54:10, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1613/17840 [2:36:51<29:54:10, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1613/17840 [2:36:51<29:54:10, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1614/17840 [2:36:57<29:41:17, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:00,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:00,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:00,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1615/17840 [2:37:04<29:36:22, 6.57s/it]g-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1615/17840 [2:37:04<29:36:22, 6.57s/it]g-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:08,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1616/17840 [2:37:10<29:21:43, 6.52s/it]g-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1616/17840 [2:37:10<29:21:43, 6.52s/it]g-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9713, 'learning_rate': 9.635985748218528e-05, 'epoch': 1.81} +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:14,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1617/17840 [2:37:16<29:09:43, 6.47s/it]g-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▌ | 1617/17840 [2:37:16<29:09:43, 6.47s/it]g-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2488, 'learning_rate': 9.635391923990498e-05, 'epoch': 1.81} + 9%|██████▌ | 1617/17840 [2:37:16<29:09:43, 6.47s/it]g-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:22,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:22,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4229, 'learning_rate': 9.63479809976247e-05, 'epoch': 1.81} +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:22,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:28,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:28,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2648, 'learning_rate': 9.634204275534442e-05, 'epoch': 1.82} +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:28,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:35,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:35,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0949, 'learning_rate': 9.633610451306414e-05, 'epoch': 1.82} +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:35,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:35,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:35,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:34:51,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1621/17840 [2:37:42<28:37:15, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:42,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1621/17840 [2:37:42<28:37:15, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:42,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1621/17840 [2:37:42<28:37:15, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:42,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1621/17840 [2:37:42<28:37:15, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:42,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:37:48<28:22:58, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:49,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:37:48<28:22:58, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:49,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:37:48<28:22:58, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:49,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1622/17840 [2:37:48<28:22:58, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:49,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1623/17840 [2:37:54<28:06:38, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1623/17840 [2:37:54<28:06:38, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:59,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:59,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0419, 'learning_rate': 9.6312351543943e-05, 'epoch': 1.82} +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:59,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:35:59,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1625/17840 [2:38:07<28:21:28, 6.30s/it]g-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1625/17840 [2:38:07<28:21:28, 6.30s/it]g-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:09,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:09,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:09,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1626/17840 [2:38:12<27:57:13, 6.21s/it]g-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:15,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:15,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:15,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:35:55,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1627/17840 [2:38:18<27:15:30, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1627/17840 [2:38:18<27:15:30, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:23,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:23,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1713, 'learning_rate': 9.628859857482185e-05, 'epoch': 1.83} +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:27,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1629/17840 [2:38:29<26:07:04, 5.80s/it]g-point operations will not be computed-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1629/17840 [2:38:29<26:07:04, 5.80s/it]g-point operations will not be computed-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:31,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:31,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:31,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:19,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1630/17840 [2:38:35<25:35:43, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:36:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1630/17840 [2:38:35<25:35:43, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:36:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:39,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:39,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8366, 'learning_rate': 9.6270783847981e-05, 'epoch': 1.83} +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:43,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:43,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:35,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1632/17840 [2:38:45<24:28:35, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1632/17840 [2:38:45<24:28:35, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:49,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:49,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:52,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:54,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:54,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:56,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:58,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:36:58,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:00,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:02,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:02,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:04,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:06,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:06,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:07,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:10,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:10,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:12,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:12,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:14,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:14,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:16,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:16,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:18,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:18,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.3906, 'learning_rate': 9.620546318289787e-05, 'epoch': 1.84} +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:22,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:26,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:26,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9513, 'learning_rate': 9.619952494061758e-05, 'epoch': 1.84} +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:30,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:30,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:33,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:33,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4166, 'learning_rate': 9.61935866983373e-05, 'epoch': 1.84} +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:33,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:33,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:41,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:41,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:41,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:41,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:37:41,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:39:49<28:04:14, 6.24s/it]g-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:39:49<28:04:14, 6.24s/it]g-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:39:49<28:04:14, 6.24s/it]g-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:39:49<28:04:14, 6.24s/it]g-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1646/17840 [2:39:49<28:04:14, 6.24s/it]g-point operations will not be computed-18 11:36:46,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1647/17840 [2:39:56<29:21:29, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1647/17840 [2:39:56<29:21:29, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1647/17840 [2:39:56<29:21:29, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1647/17840 [2:39:56<29:21:29, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1648/17840 [2:40:03<30:11:49, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1648/17840 [2:40:03<30:11:49, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▋ | 1648/17840 [2:40:03<30:11:49, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:09,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:09,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2048, 'learning_rate': 9.616389548693587e-05, 'epoch': 1.85} +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:09,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:09,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:40:18<31:40:38, 7.04s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:40:18<31:40:38, 7.04s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4351, 'learning_rate': 9.615795724465558e-05, 'epoch': 1.85} + 9%|██████▊ | 1650/17840 [2:40:18<31:40:38, 7.04s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:40:18<31:40:38, 7.04s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1650/17840 [2:40:18<31:40:38, 7.04s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1651/17840 [2:40:25<31:41:38, 7.05s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:28,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:28,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:28,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1652/17840 [2:40:32<31:37:11, 7.03s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1652/17840 [2:40:32<31:37:11, 7.03s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1652/17840 [2:40:32<31:37:11, 7.03s/it]g-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:38,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:38,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.868, 'learning_rate': 9.614014251781474e-05, 'epoch': 1.85} +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:38,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:38,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:38,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:37:57,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:40:46<31:17:56, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:40:46<31:17:56, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:40:46<31:17:56, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1654/17840 [2:40:46<31:17:56, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:40:52<31:06:29, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:40:52<31:06:29, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1655/17840 [2:40:52<31:06:29, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:58,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:58,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0638, 'learning_rate': 9.612232779097387e-05, 'epoch': 1.86} +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:58,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:58,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:38:58,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:38:47,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1657/17840 [2:41:06<30:44:33, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1657/17840 [2:41:06<30:44:33, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1657/17840 [2:41:06<30:44:33, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1657/17840 [2:41:06<30:44:33, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1658/17840 [2:41:13<30:40:07, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1658/17840 [2:41:13<30:40:07, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:17,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1659/17840 [2:41:19<30:28:48, 6.78s/it]g-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1659/17840 [2:41:19<30:28:48, 6.78s/it]g-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0324, 'learning_rate': 9.610451306413302e-05, 'epoch': 1.86} + 9%|██████▊ | 1659/17840 [2:41:19<30:28:48, 6.78s/it]g-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:25,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:25,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0718, 'learning_rate': 9.609857482185274e-05, 'epoch': 1.86} +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:25,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:25,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:25,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:07,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1661/17840 [2:41:33<30:06:06, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1661/17840 [2:41:33<30:06:06, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1661/17840 [2:41:33<30:06:06, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1662/17840 [2:41:39<30:01:16, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1662/17840 [2:41:39<30:01:16, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:42,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:42,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1663/17840 [2:41:46<29:50:49, 6.64s/it]g-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1663/17840 [2:41:46<29:50:49, 6.64s/it]g-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1143, 'learning_rate': 9.608076009501188e-05, 'epoch': 1.86} +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:50,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1664/17840 [2:41:53<29:46:40, 6.63s/it]g-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1664/17840 [2:41:53<29:46:40, 6.63s/it]g-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4047, 'learning_rate': 9.60748218527316e-05, 'epoch': 1.87} + 9%|██████▊ | 1664/17840 [2:41:53<29:46:40, 6.63s/it]g-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:58,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:58,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9439, 'learning_rate': 9.606888361045132e-05, 'epoch': 1.87} +[WARNING|modeling_utils.py:388] 2022-03-18 11:39:58,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:05,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:05,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1585, 'learning_rate': 9.606294536817104e-05, 'epoch': 1.87} +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:05,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:05,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:05,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:39:34,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:42:12<29:09:49, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:13,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:42:12<29:09:49, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:13,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:42:12<29:09:49, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:13,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1667/17840 [2:42:12<29:09:49, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:13,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1668/17840 [2:42:18<28:55:15, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1668/17840 [2:42:18<28:55:15, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1668/17840 [2:42:18<28:55:15, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1668/17840 [2:42:18<28:55:15, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1669/17840 [2:42:24<28:40:28, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:27,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:27,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1670/17840 [2:42:31<28:26:24, 6.33s/it]g-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1670/17840 [2:42:31<28:26:24, 6.33s/it]g-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:33,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:33,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1671/17840 [2:42:37<28:08:36, 6.27s/it]g-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1671/17840 [2:42:37<28:08:36, 6.27s/it]g-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:39,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:39,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1672/17840 [2:42:43<27:53:07, 6.21s/it]g-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1672/17840 [2:42:43<27:53:07, 6.21s/it]g-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:45,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:45,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1673/17840 [2:42:49<27:38:48, 6.16s/it]g-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1673/17840 [2:42:49<27:38:48, 6.16s/it]g-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:51,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:51,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:40:51,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:19,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1674/17840 [2:42:55<27:32:33, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:56,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1674/17840 [2:42:55<27:32:33, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:56,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1674/17840 [2:42:55<27:32:33, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:56,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1675/17840 [2:43:01<27:48:12, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:56,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1675/17840 [2:43:01<27:48:12, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:40:56,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:03,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:56,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:03,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:56,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:03,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:40:56,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1676/17840 [2:43:07<27:15:40, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1676/17840 [2:43:07<27:15:40, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:12,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:12,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0913, 'learning_rate': 9.59976247030879e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:16,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1678/17840 [2:43:18<25:58:41, 5.79s/it]g-point operations will not be computed-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1678/17840 [2:43:18<25:58:41, 5.79s/it]g-point operations will not be computed-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:20,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:20,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:08,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1679/17840 [2:43:23<25:28:22, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 1679/17840 [2:43:23<25:28:22, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2909, 'learning_rate': 9.598574821852732e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:28,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:28,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9189, 'learning_rate': 9.597980997624704e-05, 'epoch': 1.88} +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1681/17840 [2:43:34<24:16:15, 5.41s/it]g-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1681/17840 [2:43:34<24:16:15, 5.41s/it]g-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:36,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:38,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:38,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:40,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:42,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:42,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.121, 'learning_rate': 9.596199524940617e-05, 'epoch': 1.89} +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:46,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:41:46,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:24,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1684/17840 [2:43:48<21:40:32, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:48,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1685/17840 [2:43:52<20:41:48, 4.61s/it]g-point operations will not be computed-18 11:41:48,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1685/17840 [2:43:52<20:41:48, 4.61s/it]g-point operations will not be computed-18 11:41:48,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1685/17840 [2:43:52<20:41:48, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:52,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1686/17840 [2:43:56<19:42:13, 4.39s/it]g-point operations will not be computed-18 11:41:52,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1686/17840 [2:43:56<19:42:13, 4.39s/it]g-point operations will not be computed-18 11:41:52,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1686/17840 [2:43:56<19:42:13, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:56,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1686/17840 [2:43:56<19:42:13, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:56,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1687/17840 [2:43:59<18:30:53, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:41:59,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:01,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:59,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:01,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:41:59,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1688/17840 [2:44:02<17:14:59, 3.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:42:02,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1688/17840 [2:44:02<17:14:59, 3.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:42:02,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1689/17840 [2:44:05<15:52:01, 3.54s/it]g-point operations will not be computed-18 11:42:02,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1689/17840 [2:44:05<15:52:01, 3.54s/it]g-point operations will not be computed-18 11:42:02,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1690/17840 [2:44:08<14:29:16, 3.23s/it]g-point operations will not be computed-18 11:42:05,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:09,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:09,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1692/17840 [2:44:12<11:43:51, 2.62s/it]g-point operations will not be computed-18 11:42:10,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1692/17840 [2:44:12<11:43:51, 2.62s/it]g-point operations will not be computed-18 11:42:10,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1692/17840 [2:44:12<11:43:51, 2.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:42:13,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1692/17840 [2:44:12<11:43:51, 2.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:42:13,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:17,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:13,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:17,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:13,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1693/17840 [2:44:19<18:28:21, 4.12s/it]g-point operations will not be computed-18 11:42:13,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1693/17840 [2:44:19<18:28:21, 4.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:42:20,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1693/17840 [2:44:19<18:28:21, 4.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:42:20,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:24,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:20,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:24,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:20,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1694/17840 [2:44:27<23:00:30, 5.13s/it]g-point operations will not be computed-18 11:42:20,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 1694/17840 [2:44:27<23:00:30, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:32,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:44:34<26:00:57, 5.80s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:44:34<26:00:57, 5.80s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1097, 'learning_rate': 9.589073634204276e-05, 'epoch': 1.9} + 10%|██████▉ | 1695/17840 [2:44:34<26:00:57, 5.80s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:44:34<26:00:57, 5.80s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1695/17840 [2:44:34<26:00:57, 5.80s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1696/17840 [2:44:41<27:56:52, 6.23s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1696/17840 [2:44:41<27:56:52, 6.23s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1696/17840 [2:44:41<27:56:52, 6.23s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:48,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:48,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0531, 'learning_rate': 9.587885985748219e-05, 'epoch': 1.9} +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:48,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:48,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:42:48,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:44:56<30:00:50, 6.69s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:44:56<30:00:50, 6.69s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:44:56<30:00:50, 6.69s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1698/17840 [2:44:56<30:00:50, 6.69s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:02,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:02,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:02,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:02,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:02,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:45:10<31:38:53, 7.06s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:45:10<31:38:53, 7.06s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:45:10<31:38:53, 7.06s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:45:10<31:38:53, 7.06s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1700/17840 [2:45:10<31:38:53, 7.06s/it]g-point operations will not be computed-18 11:42:28,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1701/17840 [2:45:18<31:43:49, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1701/17840 [2:45:18<31:43:49, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1701/17840 [2:45:18<31:43:49, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1701/17840 [2:45:18<31:43:49, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:45:25<31:36:21, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:45:25<31:36:21, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1702/17840 [2:45:25<31:36:21, 7.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:31,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:31,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.928, 'learning_rate': 9.584323040380047e-05, 'epoch': 1.91} +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:31,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:31,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:31,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1704/17840 [2:45:38<31:13:11, 6.97s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:41,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:41,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:41,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1705/17840 [2:45:45<30:59:17, 6.91s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1705/17840 [2:45:45<30:59:17, 6.91s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:43:49,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1706/17840 [2:45:52<30:50:35, 6.88s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1706/17840 [2:45:52<30:50:35, 6.88s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8683, 'learning_rate': 9.582541567695963e-05, 'epoch': 1.91} + 10%|██████▉ | 1706/17840 [2:45:52<30:50:35, 6.88s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1706/17840 [2:45:52<30:50:35, 6.88s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1706/17840 [2:45:52<30:50:35, 6.88s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1707/17840 [2:45:59<30:38:06, 6.84s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:01,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:01,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1708/17840 [2:46:05<30:27:15, 6.80s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1708/17840 [2:46:05<30:27:15, 6.80s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1365, 'learning_rate': 9.581353919239906e-05, 'epoch': 1.91} +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:10,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1709/17840 [2:46:12<30:17:49, 6.76s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|██████▉ | 1709/17840 [2:46:12<30:17:49, 6.76s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0049, 'learning_rate': 9.580760095011877e-05, 'epoch': 1.92} + 10%|██████▉ | 1709/17840 [2:46:12<30:17:49, 6.76s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:18,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:18,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8497, 'learning_rate': 9.580166270783848e-05, 'epoch': 1.92} +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:18,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:18,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:18,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1711/17840 [2:46:25<29:59:59, 6.70s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:28,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:28,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:28,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1712/17840 [2:46:32<29:41:20, 6.63s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1712/17840 [2:46:32<29:41:20, 6.63s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:36,421 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:46:38<29:33:59, 6.60s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1713/17840 [2:46:38<29:33:59, 6.60s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8785, 'learning_rate': 9.578384798099764e-05, 'epoch': 1.92} + 10%|███████ | 1713/17840 [2:46:38<29:33:59, 6.60s/it]g-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:44,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:44,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8382, 'learning_rate': 9.577790973871734e-05, 'epoch': 1.92} +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:44,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:50,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:50,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0187, 'learning_rate': 9.577197149643706e-05, 'epoch': 1.92} +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:50,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:57,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:57,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5097, 'learning_rate': 9.576603325415677e-05, 'epoch': 1.92} +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:57,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:57,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:44:57,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:43:19,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:47:04<29:00:25, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:47:04<29:00:25, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:47:04<29:00:25, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1717/17840 [2:47:04<29:00:25, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1718/17840 [2:47:10<28:47:39, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:13,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:13,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:13,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1719/17840 [2:47:17<28:31:07, 6.37s/it]g-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:19,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:19,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:19,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1720/17840 [2:47:23<28:14:57, 6.31s/it]g-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1720/17840 [2:47:23<28:14:57, 6.31s/it]g-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:27,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:27,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1721/17840 [2:47:29<28:01:50, 6.26s/it]g-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:31,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:31,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:31,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1722/17840 [2:47:35<27:46:55, 6.21s/it]g-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:37,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:37,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:37,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1723/17840 [2:47:41<27:33:35, 6.16s/it]g-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:43,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:43,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:43,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:05,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1724/17840 [2:47:47<27:19:23, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1724/17840 [2:47:47<27:19:23, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1724/17840 [2:47:47<27:19:23, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1725/17840 [2:47:54<27:46:10, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1725/17840 [2:47:54<27:46:10, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:45:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:56,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:56,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:45:56,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:45:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:47:59<27:23:41, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:00,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:47:59<27:23:41, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:00,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:47:59<27:23:41, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:00,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1726/17840 [2:47:59<27:23:41, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:00,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1727/17840 [2:48:05<26:53:58, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:06,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1727/17840 [2:48:05<26:53:58, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:06,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1727/17840 [2:48:05<26:53:58, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:06,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1727/17840 [2:48:05<26:53:58, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:06,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1728/17840 [2:48:11<26:27:12, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1728/17840 [2:48:11<26:27:12, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:16,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:16,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9858, 'learning_rate': 9.568883610451307e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:20,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1730/17840 [2:48:22<25:24:55, 5.68s/it]g-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1730/17840 [2:48:22<25:24:55, 5.68s/it]g-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:24,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:26,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9641, 'learning_rate': 9.56769596199525e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:30,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:12,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1732/17840 [2:48:32<24:05:58, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████ | 1732/17840 [2:48:32<24:05:58, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.285, 'learning_rate': 9.567102137767221e-05, 'epoch': 1.94} +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:39,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:41,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:41,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:43,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:45,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:47,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:49,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:49,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:51,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:52,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:52,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:54,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:54,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:57,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:58,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:46:58,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:01,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:01,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:03,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:03,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:05,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:05,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:09,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:09,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:13,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:13,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.099, 'learning_rate': 9.560570071258907e-05, 'epoch': 1.95} +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:17,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:17,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:20,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:20,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1713, 'learning_rate': 9.559976247030879e-05, 'epoch': 1.96} +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:24,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:24,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:24,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:46:33,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1745/17840 [2:49:28<25:49:48, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1745/17840 [2:49:28<25:49:48, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1745/17840 [2:49:28<25:49:48, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1746/17840 [2:49:36<27:43:20, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1746/17840 [2:49:36<27:43:20, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0094, 'learning_rate': 9.558788598574823e-05, 'epoch': 1.96} + 10%|███████▏ | 1746/17840 [2:49:36<27:43:20, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:42,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:42,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0573, 'learning_rate': 9.558194774346794e-05, 'epoch': 1.96} +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:42,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:42,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1748/17840 [2:49:50<29:48:58, 6.67s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1748/17840 [2:49:50<29:48:58, 6.67s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9218, 'learning_rate': 9.557600950118766e-05, 'epoch': 1.96} + 10%|███████▏ | 1748/17840 [2:49:50<29:48:58, 6.67s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:56,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:56,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3138, 'learning_rate': 9.557007125890737e-05, 'epoch': 1.96} +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:56,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:47:56,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1750/17840 [2:50:04<31:13:19, 6.99s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1750/17840 [2:50:04<31:13:19, 6.99s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3514, 'learning_rate': 9.556413301662707e-05, 'epoch': 1.96} + 10%|███████▏ | 1750/17840 [2:50:04<31:13:19, 6.99s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0101, 'learning_rate': 9.555819477434679e-05, 'epoch': 1.96} +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:10,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1752/17840 [2:50:18<30:53:46, 6.91s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1752/17840 [2:50:18<30:53:46, 6.91s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:21,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:21,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:50:25<30:41:59, 6.87s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1753/17840 [2:50:25<30:41:59, 6.87s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2397, 'learning_rate': 9.554631828978623e-05, 'epoch': 1.97} + 10%|███████▏ | 1753/17840 [2:50:25<30:41:59, 6.87s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:31,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:31,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0102, 'learning_rate': 9.554038004750594e-05, 'epoch': 1.97} +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:31,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:31,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1755/17840 [2:50:38<30:14:15, 6.77s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1755/17840 [2:50:38<30:14:15, 6.77s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:41,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:41,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1756/17840 [2:50:45<30:11:21, 6.76s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1756/17840 [2:50:45<30:11:21, 6.76s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0378, 'learning_rate': 9.552850356294537e-05, 'epoch': 1.97} +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:49,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1757/17840 [2:50:51<30:01:42, 6.72s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1757/17840 [2:50:51<30:01:42, 6.72s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3428, 'learning_rate': 9.552256532066509e-05, 'epoch': 1.97} + 10%|███████▏ | 1757/17840 [2:50:51<30:01:42, 6.72s/it]g-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:57,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:57,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3186, 'learning_rate': 9.55166270783848e-05, 'epoch': 1.97} +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:57,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:57,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:48:57,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:47:29,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1759/17840 [2:51:05<29:40:44, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:06,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1759/17840 [2:51:05<29:40:44, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:06,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1759/17840 [2:51:05<29:40:44, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:06,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1759/17840 [2:51:05<29:40:44, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:06,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1760/17840 [2:51:11<29:23:11, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1760/17840 [2:51:11<29:23:11, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1760/17840 [2:51:11<29:23:11, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1760/17840 [2:51:11<29:23:11, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1761/17840 [2:51:17<29:10:28, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1761/17840 [2:51:17<29:10:28, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:22,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:22,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1762/17840 [2:51:24<29:04:53, 6.51s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1762/17840 [2:51:24<29:04:53, 6.51s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:28,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:28,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1763/17840 [2:51:30<28:46:06, 6.44s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1763/17840 [2:51:30<28:46:06, 6.44s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:34,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:34,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1764/17840 [2:51:36<28:29:21, 6.38s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1764/17840 [2:51:36<28:29:21, 6.38s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:40,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:40,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1765/17840 [2:51:43<28:25:13, 6.36s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1765/17840 [2:51:43<28:25:13, 6.36s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:47,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1766/17840 [2:51:49<28:12:01, 6.32s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1766/17840 [2:51:49<28:12:01, 6.32s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0604, 'learning_rate': 9.546912114014253e-05, 'epoch': 1.98} +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:53,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1767/17840 [2:51:55<27:52:54, 6.24s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1767/17840 [2:51:55<27:52:54, 6.24s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:59,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:49:59,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1768/17840 [2:52:01<27:33:01, 6.17s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1768/17840 [2:52:01<27:33:01, 6.17s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:05,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:05,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1769/17840 [2:52:07<27:05:47, 6.07s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1769/17840 [2:52:07<27:05:47, 6.07s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:10,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:10,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1770/17840 [2:52:13<26:44:12, 5.99s/it]g-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:15,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:15,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:15,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:49:12,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1771/17840 [2:52:18<26:19:35, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:19,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1771/17840 [2:52:18<26:19:35, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:19,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1771/17840 [2:52:18<26:19:35, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:19,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▏ | 1771/17840 [2:52:18<26:19:35, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:19,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1772/17840 [2:52:24<25:52:33, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:25,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1772/17840 [2:52:24<25:52:33, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:25,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1772/17840 [2:52:24<25:52:33, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:25,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:29,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:25,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:31,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:25,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:31,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:25,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:31,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:25,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1774/17840 [2:52:35<24:51:41, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:35,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1774/17840 [2:52:35<24:51:41, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:35,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:39,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:35,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:39,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:35,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9575, 'learning_rate': 9.541567695961996e-05, 'epoch': 1.99} +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:43,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:35,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:43,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:35,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1776/17840 [2:52:45<23:45:34, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:45,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:45,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:45,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1777/17840 [2:52:49<22:29:42, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:50,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:52,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:50,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:52,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:50,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1778/17840 [2:52:53<21:06:16, 4.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:54,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:55,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:54,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:50:55,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:50:54,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1779/17840 [2:52:57<19:42:33, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:50:57,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1780/17840 [2:53:00<18:18:48, 4.11s/it]g-point operations will not be computed-18 11:50:57,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1780/17840 [2:53:00<18:18:48, 4.11s/it]g-point operations will not be computed-18 11:50:57,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:02,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:00,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:02,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:00,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1781/17840 [2:53:03<16:44:45, 3.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:51:03,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1782/17840 [2:53:06<15:15:17, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:51:06,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1782/17840 [2:53:06<15:15:17, 3.42s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:51:06,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1783/17840 [2:53:08<13:49:29, 3.10s/it]g-point operations will not be computed-18 11:51:06,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1783/17840 [2:53:08<13:49:29, 3.10s/it]g-point operations will not be computed-18 11:51:06,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1784/17840 [2:53:10<12:14:31, 2.74s/it]g-point operations will not be computed-18 11:51:08,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1784/17840 [2:53:10<12:14:31, 2.74s/it]g-point operations will not be computed-18 11:51:08,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1784/17840 [2:53:10<12:14:31, 2.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:51:12,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1784/17840 [2:53:10<12:14:31, 2.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:51:12,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:16,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:12,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1785/17840 [2:53:18<19:10:53, 4.30s/it]g-point operations will not be computed-18 11:51:12,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1785/17840 [2:53:18<19:10:53, 4.30s/it]g-point operations will not be computed-18 11:51:12,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1785/17840 [2:53:18<19:10:53, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1785/17840 [2:53:18<19:10:53, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:23,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:23,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [2:53:26<23:19:48, 5.23s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [2:53:26<23:19:48, 5.23s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1786/17840 [2:53:26<23:19:48, 5.23s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:32,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:32,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9555, 'learning_rate': 9.534441805225654e-05, 'epoch': 2.0} +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:32,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:32,652 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [2:53:40<27:59:36, 6.28s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1788/17840 [2:53:40<27:59:36, 6.28s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7802, 'learning_rate': 9.533847980997626e-05, 'epoch': 2.0} + 10%|███████▎ | 1788/17840 [2:53:40<27:59:36, 6.28s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:47,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:47,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8618, 'learning_rate': 9.533254156769596e-05, 'epoch': 2.01} +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:47,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:47,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:47,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1790/17840 [2:53:54<29:55:54, 6.71s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1790/17840 [2:53:54<29:55:54, 6.71s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:51:59,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [2:54:01<30:20:24, 6.81s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [2:54:01<30:20:24, 6.81s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0668, 'learning_rate': 9.532066508313539e-05, 'epoch': 2.01} + 10%|███████▎ | 1791/17840 [2:54:01<30:20:24, 6.81s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [2:54:01<30:20:24, 6.81s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1791/17840 [2:54:01<30:20:24, 6.81s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1792/17840 [2:54:09<30:36:39, 6.87s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1792/17840 [2:54:09<30:36:39, 6.87s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:13,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [2:54:16<30:51:28, 6.92s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [2:54:16<30:51:28, 6.92s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6927, 'learning_rate': 9.530878859857483e-05, 'epoch': 2.01} + 10%|███████▎ | 1793/17840 [2:54:16<30:51:28, 6.92s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1793/17840 [2:54:16<30:51:28, 6.92s/it]g-point operations will not be computed-18 11:51:19,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1794/17840 [2:54:23<30:58:06, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1794/17840 [2:54:23<30:58:06, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7494, 'learning_rate': 9.530285035629454e-05, 'epoch': 2.01} + 10%|███████▎ | 1794/17840 [2:54:23<30:58:06, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1795/17840 [2:54:29<30:51:45, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1795/17840 [2:54:29<30:51:45, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9634, 'learning_rate': 9.529691211401426e-05, 'epoch': 2.01} + 10%|███████▎ | 1795/17840 [2:54:29<30:51:45, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:35,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:35,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8914, 'learning_rate': 9.529097387173397e-05, 'epoch': 2.01} +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:35,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:35,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:35,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1797/17840 [2:54:43<30:43:21, 6.89s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:46,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:46,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1798/17840 [2:54:50<30:39:29, 6.88s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1798/17840 [2:54:50<30:39:29, 6.88s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5447, 'learning_rate': 9.52790973871734e-05, 'epoch': 2.02} + 10%|███████▎ | 1798/17840 [2:54:50<30:39:29, 6.88s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:56,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:56,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.867, 'learning_rate': 9.527315914489313e-05, 'epoch': 2.02} +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:56,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:52:56,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [2:55:04<31:02:34, 6.97s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1800/17840 [2:55:04<31:02:34, 6.97s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8611, 'learning_rate': 9.526722090261283e-05, 'epoch': 2.02} +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:08,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [2:55:11<30:53:03, 6.93s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [2:55:11<30:53:03, 6.93s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7713, 'learning_rate': 9.526128266033255e-05, 'epoch': 2.02} + 10%|███████▎ | 1801/17840 [2:55:11<30:53:03, 6.93s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1801/17840 [2:55:11<30:53:03, 6.93s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [2:55:18<30:33:36, 6.86s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▎ | 1802/17840 [2:55:18<30:33:36, 6.86s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:20,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:20,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:20,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1803/17840 [2:55:24<30:16:13, 6.80s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1803/17840 [2:55:24<30:16:13, 6.80s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:28,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:28,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1804/17840 [2:55:31<30:01:54, 6.74s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1804/17840 [2:55:31<30:01:54, 6.74s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:35,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:35,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [2:55:37<29:47:09, 6.69s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [2:55:37<29:47:09, 6.69s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1805/17840 [2:55:37<29:47:09, 6.69s/it]g-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:43,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:43,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.454, 'learning_rate': 9.523159144893113e-05, 'epoch': 2.02} +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:43,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:43,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:43,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:52:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1807/17840 [2:55:51<29:32:51, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1807/17840 [2:55:51<29:32:51, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1807/17840 [2:55:51<29:32:51, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1807/17840 [2:55:51<29:32:51, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1808/17840 [2:55:57<29:14:45, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:59,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:59,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:53:59,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1809/17840 [2:56:03<29:01:34, 6.52s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1809/17840 [2:56:03<29:01:34, 6.52s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:07,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:07,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1810/17840 [2:56:10<28:39:34, 6.44s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1810/17840 [2:56:10<28:39:34, 6.44s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:13,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:13,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1811/17840 [2:56:16<28:16:18, 6.35s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1811/17840 [2:56:16<28:16:18, 6.35s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:20,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:20,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1812/17840 [2:56:22<28:04:27, 6.31s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:24,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:24,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:24,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1813/17840 [2:56:28<27:48:06, 6.24s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:30,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:30,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:30,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1814/17840 [2:56:34<27:33:52, 6.19s/it]g-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:36,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:36,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:36,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:53:51,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1815/17840 [2:56:40<27:12:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:54:41,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1815/17840 [2:56:40<27:12:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:54:41,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1815/17840 [2:56:40<27:12:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:54:41,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1815/17840 [2:56:40<27:12:41, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:54:41,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1816/17840 [2:56:46<26:56:08, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:54:41,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:48,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:41,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:48,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:41,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:48,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:41,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1817/17840 [2:56:52<26:39:52, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1817/17840 [2:56:52<26:39:52, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:57,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:54:57,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6389, 'learning_rate': 9.51603325415677e-05, 'epoch': 2.04} +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:01,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1819/17840 [2:57:03<25:48:51, 5.80s/it]g-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1819/17840 [2:57:03<25:48:51, 5.80s/it]g-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:05,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:08,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:08,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.3698, 'learning_rate': 9.514845605700713e-05, 'epoch': 2.04} +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1821/17840 [2:57:14<24:50:34, 5.58s/it]g-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1821/17840 [2:57:14<24:50:34, 5.58s/it]g-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:16,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:16,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:54:53,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1822/17840 [2:57:19<24:11:31, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1822/17840 [2:57:19<24:11:31, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:22,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1823/17840 [2:57:24<23:31:25, 5.29s/it]g-point operations will not be computed-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1823/17840 [2:57:24<23:31:25, 5.29s/it]g-point operations will not be computed-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:25,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:28,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:28,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:30,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:30,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:19,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1825/17840 [2:57:34<22:33:32, 5.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1825/17840 [2:57:34<22:33:32, 5.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:36,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1826/17840 [2:57:38<21:32:25, 4.84s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▍ | 1826/17840 [2:57:38<21:32:25, 4.84s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:39,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:41,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:41,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:43,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:45,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:45,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:48,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:48,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:50,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:51,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:51,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:54,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:54,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:56,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:56,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:58,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:55:58,893 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:00,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:00,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.0658, 'learning_rate': 9.506532066508314e-05, 'epoch': 2.06} +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:04,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:04,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:04,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:08,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:08,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:12,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:12,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:12,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:15,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:15,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:19,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:19,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:23,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:23,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:23,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:23,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:23,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [2:58:31<27:31:39, 6.19s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1838/17840 [2:58:31<27:31:39, 6.19s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:35,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1839/17840 [2:58:38<28:49:26, 6.48s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1839/17840 [2:58:38<28:49:26, 6.48s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9804, 'learning_rate': 9.503562945368172e-05, 'epoch': 2.06} + 10%|███████▌ | 1839/17840 [2:58:38<28:49:26, 6.48s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1839/17840 [2:58:38<28:49:26, 6.48s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1839/17840 [2:58:38<28:49:26, 6.48s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [2:58:45<29:34:21, 6.65s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1840/17840 [2:58:45<29:34:21, 6.65s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:49,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:56:49,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1841/17840 [2:58:52<30:02:00, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1841/17840 [2:58:52<30:02:00, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1841/17840 [2:58:52<30:02:00, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1841/17840 [2:58:52<30:02:00, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1841/17840 [2:58:52<30:02:00, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1842/17840 [2:58:59<30:23:58, 6.84s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:02,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:02,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:02,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [2:59:06<30:33:48, 6.88s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [2:59:06<30:33:48, 6.88s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [2:59:06<30:33:48, 6.88s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [2:59:06<30:33:48, 6.88s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1843/17840 [2:59:06<30:33:48, 6.88s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1844/17840 [2:59:13<30:34:47, 6.88s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:15,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:15,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:15,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1845/17840 [2:59:20<30:30:09, 6.87s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1845/17840 [2:59:20<30:30:09, 6.87s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:24,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:24,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1846/17840 [2:59:27<30:31:36, 6.87s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1846/17840 [2:59:27<30:31:36, 6.87s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1846/17840 [2:59:27<30:31:36, 6.87s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:32,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:32,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:36,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:36,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:36,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1848/17840 [2:59:40<30:14:20, 6.81s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1848/17840 [2:59:40<30:14:20, 6.81s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:44,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:44,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [2:59:47<30:01:15, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [2:59:47<30:01:15, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [2:59:47<30:01:15, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [2:59:47<30:01:15, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1849/17840 [2:59:47<30:01:15, 6.76s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1850/17840 [2:59:54<30:26:13, 6.85s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:56,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:56,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:57:56,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1851/17840 [3:00:00<30:12:53, 6.80s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:03,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:03,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:00:07<29:53:49, 6.73s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1852/17840 [3:00:07<29:53:49, 6.73s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.738, 'learning_rate': 9.495843230403802e-05, 'epoch': 2.08} +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:11,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1853/17840 [3:00:14<29:44:45, 6.70s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1853/17840 [3:00:14<29:44:45, 6.70s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8687, 'learning_rate': 9.495249406175773e-05, 'epoch': 2.08} +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:18,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1854/17840 [3:00:20<29:24:17, 6.62s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1854/17840 [3:00:20<29:24:17, 6.62s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9134, 'learning_rate': 9.494655581947743e-05, 'epoch': 2.08} + 10%|███████▌ | 1854/17840 [3:00:20<29:24:17, 6.62s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:26,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:26,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8918, 'learning_rate': 9.494061757719715e-05, 'epoch': 2.08} +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:26,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:26,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1856/17840 [3:00:33<29:07:59, 6.56s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1856/17840 [3:00:33<29:07:59, 6.56s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:36,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:36,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1857/17840 [3:00:39<28:55:28, 6.51s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1857/17840 [3:00:39<28:55:28, 6.51s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:42,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:42,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1858/17840 [3:00:46<28:38:49, 6.45s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1858/17840 [3:00:46<28:38:49, 6.45s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6321, 'learning_rate': 9.49228028503563e-05, 'epoch': 2.08} +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:50,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1859/17840 [3:00:52<28:23:53, 6.40s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1859/17840 [3:00:52<28:23:53, 6.40s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:54,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:58:54,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1860/17840 [3:00:58<28:17:32, 6.37s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1860/17840 [3:00:58<28:17:32, 6.37s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6147, 'learning_rate': 9.491092636579573e-05, 'epoch': 2.09} +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:02,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1861/17840 [3:01:04<27:59:54, 6.31s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1861/17840 [3:01:04<27:59:54, 6.31s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6511, 'learning_rate': 9.490498812351545e-05, 'epoch': 2.09} +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:08,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1862/17840 [3:01:11<27:45:38, 6.25s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1862/17840 [3:01:11<27:45:38, 6.25s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4737, 'learning_rate': 9.489904988123516e-05, 'epoch': 2.09} +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:14,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1863/17840 [3:01:17<27:33:53, 6.21s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 1863/17840 [3:01:17<27:33:53, 6.21s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6293, 'learning_rate': 9.489311163895488e-05, 'epoch': 2.09} +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:20,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1864/17840 [3:01:23<27:19:24, 6.16s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1864/17840 [3:01:23<27:19:24, 6.16s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:25,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:25,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1865/17840 [3:01:29<27:11:09, 6.13s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1865/17840 [3:01:29<27:11:09, 6.13s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:31,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:31,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1866/17840 [3:01:35<26:57:55, 6.08s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1866/17840 [3:01:35<26:57:55, 6.08s/it]g-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:37,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:37,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:55:34,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:01:41<26:34:30, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:59:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:01:41<26:34:30, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:59:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7548, 'learning_rate': 9.486935866983373e-05, 'epoch': 2.09} + 10%|███████▋ | 1867/17840 [3:01:41<26:34:30, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:59:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1867/17840 [3:01:41<26:34:30, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:59:41,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1868/17840 [3:01:46<26:07:34, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1868/17840 [3:01:46<26:07:34, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:51,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:51,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7835, 'learning_rate': 9.485748218527316e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:55,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1870/17840 [3:01:57<25:08:20, 5.67s/it]g-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1870/17840 [3:01:57<25:08:20, 5.67s/it]g-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 11:59:59,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:02,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:02,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8714, 'learning_rate': 9.484560570071259e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:06,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:06,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 1872/17840 [3:02:08<24:15:24, 5.47s/it]g-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:10,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:12,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:12,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6957, 'learning_rate': 9.483372921615203e-05, 'epoch': 2.1} +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:16,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1874/17840 [3:02:18<23:12:08, 5.23s/it]g-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:19,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:19,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:22,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:22,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:26,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:26,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 11:59:47,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1876/17840 [3:02:28<22:23:47, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:28,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:30,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:28,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:30,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:28,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1877/17840 [3:02:32<21:15:37, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:32,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:34,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:32,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:34,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:32,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1878/17840 [3:02:36<20:08:44, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:36,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:38,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:36,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:38,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:36,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1879/17840 [3:02:39<18:59:44, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:40,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1879/17840 [3:02:39<18:59:44, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:40,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1880/17840 [3:02:43<17:50:19, 4.02s/it]g-point operations will not be computed-18 12:00:40,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:44,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:43,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:44,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:43,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1881/17840 [3:02:46<16:30:20, 3.72s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:46,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1881/17840 [3:02:46<16:30:20, 3.72s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:46,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1882/17840 [3:02:49<15:07:11, 3.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:48,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1882/17840 [3:02:49<15:07:11, 3.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:48,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1883/17840 [3:02:51<13:46:26, 3.11s/it]g-point operations will not be computed-18 12:00:48,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1883/17840 [3:02:51<13:46:26, 3.11s/it]g-point operations will not be computed-18 12:00:48,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:02:53<12:18:20, 2.78s/it]g-point operations will not be computed-18 12:00:51,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:02:53<12:18:20, 2.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:54,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1884/17840 [3:02:53<12:18:20, 2.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:00:54,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:58,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:54,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:00:58,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:00:54,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:03:01<18:39:44, 4.21s/it]g-point operations will not be computed-18 12:00:54,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:03:01<18:39:44, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1885/17840 [3:03:01<18:39:44, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:05,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:05,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:03:08<22:53:07, 5.16s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:03:08<22:53:07, 5.16s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:03:08<22:53:07, 5.16s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1886/17840 [3:03:08<22:53:07, 5.16s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:14,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:14,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:14,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:14,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:14,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1888/17840 [3:03:22<27:27:18, 6.20s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1888/17840 [3:03:22<27:27:18, 6.20s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1888/17840 [3:03:22<27:27:18, 6.20s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1888/17840 [3:03:22<27:27:18, 6.20s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:29,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:29,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:29,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:29,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:29,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1890/17840 [3:03:36<29:25:57, 6.64s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1890/17840 [3:03:36<29:25:57, 6.64s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:41,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:41,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:03:43<29:52:19, 6.74s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:03:43<29:52:19, 6.74s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:03:43<29:52:19, 6.74s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:03:43<29:52:19, 6.74s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1891/17840 [3:03:43<29:52:19, 6.74s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1892/17840 [3:03:50<30:08:11, 6.80s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:53,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:53,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:01:53,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1893/17840 [3:03:57<30:21:51, 6.85s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1893/17840 [3:03:57<30:21:51, 6.85s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▋ | 1893/17840 [3:03:57<30:21:51, 6.85s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8035, 'learning_rate': 9.470902612826605e-05, 'epoch': 2.12} +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:03,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1895/17840 [3:04:11<30:19:59, 6.85s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:14,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:14,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:14,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1896/17840 [3:04:18<30:14:47, 6.83s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1896/17840 [3:04:18<30:14:47, 6.83s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1896/17840 [3:04:18<30:14:47, 6.83s/it]g-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:24,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:24,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6604, 'learning_rate': 9.469121140142518e-05, 'epoch': 2.13} +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:24,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:24,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:24,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:01:02,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:04:31<29:53:07, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:04:31<29:53:07, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:04:31<29:53:07, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1898/17840 [3:04:31<29:53:07, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1899/17840 [3:04:38<29:49:03, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1899/17840 [3:04:38<29:49:03, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:02:42,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:04:45<30:22:13, 6.86s/it]g-point operations will not be computed-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:04:45<30:22:13, 6.86s/it]g-point operations will not be computed-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8324, 'learning_rate': 9.467339667458433e-05, 'epoch': 2.13} + 11%|███████▊ | 1900/17840 [3:04:45<30:22:13, 6.86s/it]g-point operations will not be computed-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:04:45<30:22:13, 6.86s/it]g-point operations will not be computed-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1900/17840 [3:04:45<30:22:13, 6.86s/it]g-point operations will not be computed-18 12:02:32,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1901/17840 [3:04:52<30:05:45, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1901/17840 [3:04:52<30:05:45, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1901/17840 [3:04:52<30:05:45, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1901/17840 [3:04:52<30:05:45, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1902/17840 [3:04:58<29:44:55, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:01,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:01,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:01,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1903/17840 [3:05:05<29:30:32, 6.67s/it]g-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1903/17840 [3:05:05<29:30:32, 6.67s/it]g-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:09,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1904/17840 [3:05:11<29:07:50, 6.58s/it]g-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1904/17840 [3:05:11<29:07:50, 6.58s/it]g-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6149, 'learning_rate': 9.464964370546318e-05, 'epoch': 2.13} + 11%|███████▊ | 1904/17840 [3:05:11<29:07:50, 6.58s/it]g-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:17,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:17,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7419, 'learning_rate': 9.46437054631829e-05, 'epoch': 2.14} +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:17,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:17,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:17,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:02:53,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1906/17840 [3:05:24<28:41:37, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:25,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1906/17840 [3:05:24<28:41:37, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:25,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1906/17840 [3:05:24<28:41:37, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:25,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1906/17840 [3:05:24<28:41:37, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:25,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1907/17840 [3:05:30<28:28:59, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:31,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1907/17840 [3:05:30<28:28:59, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:31,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1907/17840 [3:05:30<28:28:59, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:31,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1907/17840 [3:05:30<28:28:59, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:31,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1908/17840 [3:05:37<28:14:28, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:31,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:39,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:31,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:39,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:31,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:03:39,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:31,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1909/17840 [3:05:43<27:59:33, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:44,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1909/17840 [3:05:43<27:59:33, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:44,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1909/17840 [3:05:43<27:59:33, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:44,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1909/17840 [3:05:43<27:59:33, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:44,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1910/17840 [3:05:49<27:43:55, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:50,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1910/17840 [3:05:49<27:43:55, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:50,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1910/17840 [3:05:49<27:43:55, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:50,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1910/17840 [3:05:49<27:43:55, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:50,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1911/17840 [3:05:55<27:28:59, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1911/17840 [3:05:55<27:28:59, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:00,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:00,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9259, 'learning_rate': 9.460213776722092e-05, 'epoch': 2.14} +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:00,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:06,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:06,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9912, 'learning_rate': 9.459619952494062e-05, 'epoch': 2.14} +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:06,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:06,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:06,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:03:56,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1914/17840 [3:06:13<26:50:46, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1914/17840 [3:06:13<26:50:46, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:18,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:18,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7764, 'learning_rate': 9.458432304038005e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:18,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:24,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:24,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6523, 'learning_rate': 9.457838479809976e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:28,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1917/17840 [3:06:30<25:48:48, 5.84s/it]g-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1917/17840 [3:06:30<25:48:48, 5.84s/it]g-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:32,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:32,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:32,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:14,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1918/17840 [3:06:36<25:23:30, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:04:36,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1918/17840 [3:06:36<25:23:30, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:04:36,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:40,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:36,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:40,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:36,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5995, 'learning_rate': 9.456057007125892e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:44,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:36,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1920/17840 [3:06:47<24:37:04, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:04:47,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1920/17840 [3:06:47<24:37:04, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:04:47,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.81, 'learning_rate': 9.455463182897863e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:51,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:47,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:51,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:47,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5218, 'learning_rate': 9.454869358669835e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-18 12:04:55,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:47,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1922/17840 [3:06:57<23:39:23, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:04:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▊ | 1922/17840 [3:06:57<23:39:23, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:04:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4431, 'learning_rate': 9.454275534441805e-05, 'epoch': 2.15} +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:01,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:01,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:03,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:06,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:06,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4826, 'learning_rate': 9.453087885985748e-05, 'epoch': 2.16} +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:09,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:04:57,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1925/17840 [3:07:11<22:09:57, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1925/17840 [3:07:11<22:09:57, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6207, 'learning_rate': 9.45249406175772e-05, 'epoch': 2.16} +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:15,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:15,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:17,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:19,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:19,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:20,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:20,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:24,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:24,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:26,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:27,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:27,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:30,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:30,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:31,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:31,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:34,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:34,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:36,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:36,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:38,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:38,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:42,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:42,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:42,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:45,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:45,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:49,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:49,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:49,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:53,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:53,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:56,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:05:56,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:00,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:00,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:00,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:00,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:00,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1938/17840 [3:08:08<27:10:34, 6.15s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1938/17840 [3:08:08<27:10:34, 6.15s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:12,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:12,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:08:15<28:26:57, 6.44s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:08:15<28:26:57, 6.44s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:08:15<28:26:57, 6.44s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:08:15<28:26:57, 6.44s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1939/17840 [3:08:15<28:26:57, 6.44s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1940/17840 [3:08:22<29:15:38, 6.63s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:25,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:25,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:25,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:08:29<29:48:22, 6.75s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:08:29<29:48:22, 6.75s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:08:29<29:48:22, 6.75s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:08:29<29:48:22, 6.75s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1941/17840 [3:08:29<29:48:22, 6.75s/it]g-point operations will not be computed-18 12:05:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:08:36<30:04:34, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:08:36<30:04:34, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:08:36<30:04:34, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1942/17840 [3:08:36<30:04:34, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1943/17840 [3:08:43<30:18:07, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1943/17840 [3:08:43<30:18:07, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1943/17840 [3:08:43<30:18:07, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:49,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:49,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.629, 'learning_rate': 9.441211401425178e-05, 'epoch': 2.18} +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:49,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:49,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:49,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1945/17840 [3:08:57<30:19:35, 6.87s/it]g-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:59,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:59,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:06:59,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:09:04<30:13:06, 6.84s/it]g-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:09:04<30:13:06, 6.84s/it]g-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1946/17840 [3:09:04<30:13:06, 6.84s/it]g-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:10,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:10,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6351, 'learning_rate': 9.439429928741093e-05, 'epoch': 2.18} +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:10,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:10,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:10,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:06:37,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:09:17<29:58:32, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:09:17<29:58:32, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:09:17<29:58:32, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1948/17840 [3:09:17<29:58:32, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1949/17840 [3:09:24<29:43:27, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1949/17840 [3:09:24<29:43:27, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:28,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1950/17840 [3:09:31<30:14:26, 6.85s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1950/17840 [3:09:31<30:14:26, 6.85s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5689, 'learning_rate': 9.437648456057007e-05, 'epoch': 2.19} + 11%|███████▉ | 1950/17840 [3:09:31<30:14:26, 6.85s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1950/17840 [3:09:31<30:14:26, 6.85s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1950/17840 [3:09:31<30:14:26, 6.85s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1951/17840 [3:09:37<30:00:41, 6.80s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:40,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:40,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:40,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1952/17840 [3:09:44<29:41:40, 6.73s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:47,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:47,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1953/17840 [3:09:51<29:21:45, 6.65s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1953/17840 [3:09:51<29:21:45, 6.65s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6359, 'learning_rate': 9.435866983372922e-05, 'epoch': 2.19} +[WARNING|modeling_utils.py:388] 2022-03-18 12:07:55,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1954/17840 [3:09:57<29:09:36, 6.61s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1954/17840 [3:09:57<29:09:36, 6.61s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6352, 'learning_rate': 9.435273159144894e-05, 'epoch': 2.19} +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:01,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1955/17840 [3:10:04<28:59:49, 6.57s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|███████▉ | 1955/17840 [3:10:04<28:59:49, 6.57s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5861, 'learning_rate': 9.434679334916865e-05, 'epoch': 2.19} + 11%|███████▉ | 1955/17840 [3:10:04<28:59:49, 6.57s/it]g-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:09,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:09,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7238, 'learning_rate': 9.434085510688837e-05, 'epoch': 2.19} +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:09,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:09,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:09,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:07:18,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1957/17840 [3:10:16<28:35:09, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:17,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1957/17840 [3:10:16<28:35:09, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:17,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1957/17840 [3:10:16<28:35:09, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:17,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1958/17840 [3:10:23<28:25:17, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1958/17840 [3:10:23<28:25:17, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4974, 'learning_rate': 9.43289786223278e-05, 'epoch': 2.2} + 11%|████████ | 1958/17840 [3:10:23<28:25:17, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1958/17840 [3:10:23<28:25:17, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1959/17840 [3:10:29<28:14:37, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:31,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:31,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1960/17840 [3:10:35<27:56:26, 6.33s/it]g-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1960/17840 [3:10:35<27:56:26, 6.33s/it]g-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9728, 'learning_rate': 9.431710213776722e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:39,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1961/17840 [3:10:41<27:47:34, 6.30s/it]g-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1961/17840 [3:10:41<27:47:34, 6.30s/it]g-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:44,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:44,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1962/17840 [3:10:47<27:25:52, 6.22s/it]g-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1962/17840 [3:10:47<27:25:52, 6.22s/it]g-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:50,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:08:50,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:08:23,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1963/17840 [3:10:53<27:09:59, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:54,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1963/17840 [3:10:53<27:09:59, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:54,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7612, 'learning_rate': 9.429928741092637e-05, 'epoch': 2.2} + 11%|████████ | 1963/17840 [3:10:53<27:09:59, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:08:54,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1964/17840 [3:10:59<26:56:44, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:09:00,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1964/17840 [3:10:59<26:56:44, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:09:00,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6484, 'learning_rate': 9.429334916864608e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:05,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:00,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:05,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:00,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:05,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:00,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4818, 'learning_rate': 9.428741092636581e-05, 'epoch': 2.2} +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:05,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:00,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:05,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:00,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1966/17840 [3:11:11<26:34:57, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:15,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1967/17840 [3:11:17<26:10:53, 5.94s/it]g-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1967/17840 [3:11:17<26:10:53, 5.94s/it]g-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4564, 'learning_rate': 9.427553444180524e-05, 'epoch': 2.21} +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:21,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:21,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1968/17840 [3:11:23<25:45:30, 5.84s/it]g-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:25,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:27,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:27,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:27,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:31,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1970/17840 [3:11:34<24:54:56, 5.65s/it]g-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1970/17840 [3:11:34<24:54:56, 5.65s/it]g-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6604, 'learning_rate': 9.425771971496437e-05, 'epoch': 2.21} +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:37,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1971/17840 [3:11:39<24:27:45, 5.55s/it]g-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1971/17840 [3:11:39<24:27:45, 5.55s/it]g-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:41,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:41,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:41,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:12,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1972/17840 [3:11:44<24:07:44, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:47,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1973/17840 [3:11:49<23:28:26, 5.33s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1973/17840 [3:11:49<23:28:26, 5.33s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:51,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:53,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:53,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8517, 'learning_rate': 9.423396674584324e-05, 'epoch': 2.21} +[WARNING|modeling_utils.py:388] 2022-03-18 12:09:57,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1975/17840 [3:11:59<22:53:21, 5.19s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████ | 1975/17840 [3:11:59<22:53:21, 5.19s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:01,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:03,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:03,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:05,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:07,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:07,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:09,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:11,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:11,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:13,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:16,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:16,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:17,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:17,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:19,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:21,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:21,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.2907, 'learning_rate': 9.419239904988124e-05, 'epoch': 2.22} +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:24,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:24,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:26,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:26,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:27,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:27,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:31,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:34,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:34,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8703, 'learning_rate': 9.416864608076011e-05, 'epoch': 2.23} +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:38,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:38,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:38,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:42,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:42,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:46,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:46,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:46,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1987/17840 [3:12:50<25:24:18, 5.77s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1987/17840 [3:12:50<25:24:18, 5.77s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:55,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:10:55,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:12:57<27:12:04, 6.18s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:12:57<27:12:04, 6.18s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:12:57<27:12:04, 6.18s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:12:57<27:12:04, 6.18s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1988/17840 [3:12:57<27:12:04, 6.18s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1989/17840 [3:13:04<28:28:31, 6.47s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1989/17840 [3:13:04<28:28:31, 6.47s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:09,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1990/17840 [3:13:11<29:19:14, 6.66s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1990/17840 [3:13:11<29:19:14, 6.66s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6256, 'learning_rate': 9.413895486935867e-05, 'epoch': 2.23} + 11%|████████▏ | 1990/17840 [3:13:11<29:19:14, 6.66s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1990/17840 [3:13:11<29:19:14, 6.66s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1990/17840 [3:13:11<29:19:14, 6.66s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1991/17840 [3:13:18<29:44:28, 6.76s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:21,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:21,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:21,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1992/17840 [3:13:25<30:03:59, 6.83s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1992/17840 [3:13:25<30:03:59, 6.83s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1992/17840 [3:13:25<30:03:59, 6.83s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:31,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:31,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5347, 'learning_rate': 9.412114014251782e-05, 'epoch': 2.23} +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:31,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:31,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:31,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:13:39<30:15:20, 6.87s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:13:39<30:15:20, 6.87s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1994/17840 [3:13:39<30:15:20, 6.87s/it]g-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:45,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:45,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6513, 'learning_rate': 9.410926365795725e-05, 'epoch': 2.24} +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:45,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:45,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:11:45,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:09:45,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1996/17840 [3:13:53<30:09:51, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1996/17840 [3:13:53<30:09:51, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1996/17840 [3:13:53<30:09:51, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1996/17840 [3:13:53<30:09:51, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1997/17840 [3:14:00<30:06:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1997/17840 [3:14:00<30:06:07, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:04,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1998/17840 [3:14:06<29:59:00, 6.81s/it]g-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 1998/17840 [3:14:06<29:59:00, 6.81s/it]g-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5279, 'learning_rate': 9.409144893111639e-05, 'epoch': 2.24} + 11%|████████▏ | 1998/17840 [3:14:06<29:59:00, 6.81s/it]g-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:12,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:12,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8247, 'learning_rate': 9.408551068883611e-05, 'epoch': 2.24} +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:12,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:12,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:14:20<30:15:34, 6.88s/it]g-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2000/17840 [3:14:20<30:15:34, 6.88s/it]g-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:23,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:23,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2001/17840 [3:14:27<30:00:11, 6.82s/it]g-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2001/17840 [3:14:27<30:00:11, 6.82s/it]g-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7692, 'learning_rate': 9.407363420427554e-05, 'epoch': 2.24} + 11%|████████▏ | 2001/17840 [3:14:27<30:00:11, 6.82s/it]g-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:33,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:33,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5939, 'learning_rate': 9.406769596199525e-05, 'epoch': 2.24} +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:33,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:33,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:33,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:11:54,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2003/17840 [3:14:40<29:19:29, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2003/17840 [3:14:40<29:19:29, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2003/17840 [3:14:40<29:19:29, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2003/17840 [3:14:40<29:19:29, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2004/17840 [3:14:46<29:04:18, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:49,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:49,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2005/17840 [3:14:53<28:51:26, 6.56s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2005/17840 [3:14:53<28:51:26, 6.56s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.3792, 'learning_rate': 9.404988123515441e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-18 12:12:57,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2006/17840 [3:14:59<28:43:29, 6.53s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2006/17840 [3:14:59<28:43:29, 6.53s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.734, 'learning_rate': 9.404394299287412e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:03,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2007/17840 [3:15:06<28:28:47, 6.48s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2007/17840 [3:15:06<28:28:47, 6.48s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6395, 'learning_rate': 9.403800475059384e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:10,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2008/17840 [3:15:12<28:11:42, 6.41s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2008/17840 [3:15:12<28:11:42, 6.41s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.732, 'learning_rate': 9.403206650831354e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:16,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2009/17840 [3:15:18<28:00:51, 6.37s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2009/17840 [3:15:18<28:00:51, 6.37s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.718, 'learning_rate': 9.402612826603325e-05, 'epoch': 2.25} + 11%|████████▏ | 2009/17840 [3:15:18<28:00:51, 6.37s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:24,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:24,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9042, 'learning_rate': 9.402019002375297e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:24,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:30,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:30,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8304, 'learning_rate': 9.401425178147269e-05, 'epoch': 2.25} +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:30,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:36,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:36,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7248, 'learning_rate': 9.400831353919241e-05, 'epoch': 2.26} +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:36,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:42,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:42,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.672, 'learning_rate': 9.400237529691212e-05, 'epoch': 2.26} +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:42,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:42,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:48,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:48,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:52,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:52,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2015/17840 [3:15:55<26:45:05, 6.09s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2015/17840 [3:15:55<26:45:05, 6.09s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:58,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:13:58,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▏ | 2016/17840 [3:16:01<26:35:33, 6.05s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:03,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:03,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:03,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2017/17840 [3:16:07<26:17:14, 5.98s/it]g-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:09,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:09,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:09,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:12:41,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2018/17840 [3:16:12<25:57:15, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:13,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2018/17840 [3:16:12<25:57:15, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:13,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2018/17840 [3:16:12<25:57:15, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:13,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2018/17840 [3:16:12<25:57:15, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:13,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2019/17840 [3:16:18<25:32:23, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:19,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:21,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:19,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:21,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:19,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2020/17840 [3:16:23<25:00:56, 5.69s/it]g-point operations will not be computed-18 12:14:19,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:25,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:19,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:25,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:19,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:25,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:19,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2021/17840 [3:16:29<24:38:17, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2021/17840 [3:16:29<24:38:17, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:33,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:33,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:36,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:36,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:36,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2023/17840 [3:16:39<23:27:26, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:39,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2023/17840 [3:16:39<23:27:26, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:39,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:43,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:39,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:43,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:39,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:45,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:39,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:45,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:39,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:45,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:39,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2025/17840 [3:16:49<22:27:34, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:49,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:51,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:49,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:51,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:49,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2026/17840 [3:16:53<21:22:25, 4.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:53,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:55,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:53,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:55,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:53,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2027/17840 [3:16:57<20:11:20, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:14:57,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:59,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:57,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:14:59,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:14:57,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2028/17840 [3:17:01<18:59:55, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:01,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2029/17840 [3:17:04<17:48:51, 4.06s/it]g-point operations will not be computed-18 12:15:01,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2029/17840 [3:17:04<17:48:51, 4.06s/it]g-point operations will not be computed-18 12:15:01,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:15:06,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:04,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:15:06,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:04,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2030/17840 [3:17:07<16:29:29, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:07,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2030/17840 [3:17:07<16:29:29, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:07,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2031/17840 [3:17:10<15:07:27, 3.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:10,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2032/17840 [3:17:12<13:48:16, 3.14s/it]g-point operations will not be computed-18 12:15:10,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2032/17840 [3:17:12<13:48:16, 3.14s/it]g-point operations will not be computed-18 12:15:10,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2033/17840 [3:17:14<12:33:05, 2.86s/it]g-point operations will not be computed-18 12:15:12,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2033/17840 [3:17:14<12:33:05, 2.86s/it]g-point operations will not be computed-18 12:15:12,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2034/17840 [3:17:16<11:23:34, 2.59s/it]g-point operations will not be computed-18 12:15:14,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2034/17840 [3:17:16<11:23:34, 2.59s/it]g-point operations will not be computed-18 12:15:14,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2034/17840 [3:17:16<11:23:34, 2.59s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:18,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2034/17840 [3:17:16<11:23:34, 2.59s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:18,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:15:21,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:18,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:15:21,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:18,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2035/17840 [3:17:24<18:01:14, 4.10s/it]g-point operations will not be computed-18 12:15:18,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2035/17840 [3:17:24<18:01:14, 4.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:25,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2035/17840 [3:17:24<18:01:14, 4.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:25,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:15:29,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:25,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:15:29,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:25,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2036/17840 [3:17:31<22:22:04, 5.10s/it]g-point operations will not be computed-18 12:15:25,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2036/17840 [3:17:31<22:22:04, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:33,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2036/17840 [3:17:31<22:22:04, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:33,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2036/17840 [3:17:31<22:22:04, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:33,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2036/17840 [3:17:31<22:22:04, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:33,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:17:39<25:22:26, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:17:39<25:22:26, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:17:39<25:22:26, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2037/17840 [3:17:39<25:22:26, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:17:46<27:15:52, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:17:46<27:15:52, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:17:46<27:15:52, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:17:46<27:15:52, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2038/17840 [3:17:46<27:15:52, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:17:53<28:25:44, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:17:53<28:25:44, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:17:53<28:25:44, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2039/17840 [3:17:53<28:25:44, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2040/17840 [3:18:00<29:11:42, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2040/17840 [3:18:00<29:11:42, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:05,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5982, 'learning_rate': 9.383610451306414e-05, 'epoch': 2.29} + g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:18:14<30:05:05, 6.86s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2042/17840 [3:18:14<30:05:05, 6.86s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:19,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:18:21<30:19:11, 6.91s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:18:21<30:19:11, 6.91s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.941, 'learning_rate': 9.382422802850357e-05, 'epoch': 2.29} + 11%|████████▎ | 2043/17840 [3:18:21<30:19:11, 6.91s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:18:21<30:19:11, 6.91s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2043/17840 [3:18:21<30:19:11, 6.91s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2044/17840 [3:18:28<30:23:11, 6.93s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:31,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:31,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2045/17840 [3:18:35<30:18:14, 6.91s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▎ | 2045/17840 [3:18:35<30:18:14, 6.91s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8203, 'learning_rate': 9.3812351543943e-05, 'epoch': 2.29} + 11%|████████▎ | 2045/17840 [3:18:35<30:18:14, 6.91s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:41,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:41,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6975, 'learning_rate': 9.380641330166271e-05, 'epoch': 2.29} +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:41,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:41,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:41,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2047/17840 [3:18:49<30:09:20, 6.87s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:52,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:16:52,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2048/17840 [3:18:56<30:03:24, 6.85s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2048/17840 [3:18:56<30:03:24, 6.85s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6285, 'learning_rate': 9.379453681710214e-05, 'epoch': 2.3} + 11%|████████▍ | 2048/17840 [3:18:56<30:03:24, 6.85s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:02,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:02,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9999, 'learning_rate': 9.378859857482186e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:02,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:02,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2050/17840 [3:19:10<30:24:50, 6.93s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2050/17840 [3:19:10<30:24:50, 6.93s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.524, 'learning_rate': 9.378266033254157e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:14,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2051/17840 [3:19:16<30:10:36, 6.88s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 2051/17840 [3:19:16<30:10:36, 6.88s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7017, 'learning_rate': 9.377672209026129e-05, 'epoch': 2.3} + 11%|████████▍ | 2051/17840 [3:19:16<30:10:36, 6.88s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:22,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:22,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.743, 'learning_rate': 9.377078384798101e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:22,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:22,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:22,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2053/17840 [3:19:30<29:29:28, 6.73s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:32,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:32,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2054/17840 [3:19:36<29:05:56, 6.64s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2054/17840 [3:19:36<29:05:56, 6.64s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:39,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:39,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2055/17840 [3:19:43<28:55:17, 6.60s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2055/17840 [3:19:43<28:55:17, 6.60s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7424, 'learning_rate': 9.375296912114014e-05, 'epoch': 2.3} +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:47,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2056/17840 [3:19:49<28:46:23, 6.56s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2056/17840 [3:19:49<28:46:23, 6.56s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.551, 'learning_rate': 9.374703087885986e-05, 'epoch': 2.3} + 12%|████████▍ | 2056/17840 [3:19:49<28:46:23, 6.56s/it]g-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:55,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:55,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5337, 'learning_rate': 9.374109263657957e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-18 12:17:55,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:01,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:01,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4615, 'learning_rate': 9.373515439429929e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:01,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:01,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:01,478 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:15:54,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2059/17840 [3:20:08<28:05:21, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:09,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2059/17840 [3:20:08<28:05:21, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:09,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2059/17840 [3:20:08<28:05:21, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:09,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2059/17840 [3:20:08<28:05:21, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:09,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2060/17840 [3:20:14<27:50:38, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:15,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2060/17840 [3:20:14<27:50:38, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:15,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2060/17840 [3:20:14<27:50:38, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:15,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2061/17840 [3:20:21<27:44:03, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:21,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2061/17840 [3:20:21<27:44:03, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:21,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7954, 'learning_rate': 9.371733966745844e-05, 'epoch': 2.31} + 12%|████████▍ | 2061/17840 [3:20:21<27:44:03, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:21,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2062/17840 [3:20:27<27:32:53, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:27,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2062/17840 [3:20:27<27:32:53, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:27,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7789, 'learning_rate': 9.371140142517814e-05, 'epoch': 2.31} + 12%|████████▍ | 2062/17840 [3:20:27<27:32:53, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:27,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2063/17840 [3:20:33<27:15:51, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:34,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2063/17840 [3:20:33<27:15:51, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:34,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8056, 'learning_rate': 9.370546318289786e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:38,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:34,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:38,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:34,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:38,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:34,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9689, 'learning_rate': 9.369952494061758e-05, 'epoch': 2.31} +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:38,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:34,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:20:45<26:48:53, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:46,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:20:45<26:48:53, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:46,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6537, 'learning_rate': 9.36935866983373e-05, 'epoch': 2.32} + 12%|████████▍ | 2065/17840 [3:20:45<26:48:53, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:46,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2065/17840 [3:20:45<26:48:53, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:46,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2066/17840 [3:20:51<26:29:31, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:54,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:18:54,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2067/17840 [3:20:57<26:11:41, 5.98s/it]g-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2067/17840 [3:20:57<26:11:41, 5.98s/it]g-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:00,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:00,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2068/17840 [3:21:02<25:39:42, 5.86s/it]g-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:04,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:04,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:04,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:18:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2069/17840 [3:21:08<25:14:33, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2069/17840 [3:21:08<25:14:33, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:12,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:12,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4091, 'learning_rate': 9.366389548693587e-05, 'epoch': 2.32} +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:16,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:16,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2071/17840 [3:21:18<24:25:40, 5.58s/it]g-point operations will not be computed-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:20,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:20,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:20,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2072/17840 [3:21:24<23:59:53, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:19:24,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2072/17840 [3:21:24<23:59:53, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:19:24,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2072/17840 [3:21:24<23:59:53, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:19:24,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:28,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:24,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:30,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:24,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:30,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:24,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:30,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:24,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2074/17840 [3:21:34<22:42:01, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:36,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:36,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▍ | 2075/17840 [3:21:39<22:40:30, 5.18s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:40,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:40,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:42,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:44,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:44,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:46,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:48,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:48,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:50,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:52,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:52,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:53,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:53,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:57,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:58,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:19:58,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:03,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:03,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:05,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:05,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:06,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:06,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:10,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:10,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:10,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:13,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:13,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:17,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:21,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:21,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7896, 'learning_rate': 9.356888361045131e-05, 'epoch': 2.34} +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:24,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:24,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:24,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:22:29<25:12:08, 5.76s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:22:29<25:12:08, 5.76s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2087/17840 [3:22:29<25:12:08, 5.76s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:35,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:35,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7712, 'learning_rate': 9.355700712589074e-05, 'epoch': 2.34} +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:35,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:35,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:35,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2089/17840 [3:22:43<28:19:22, 6.47s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2089/17840 [3:22:43<28:19:22, 6.47s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2089/17840 [3:22:43<28:19:22, 6.47s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:49,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:49,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.498, 'learning_rate': 9.354513064133016e-05, 'epoch': 2.34} +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:49,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:49,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:20:49,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2091/17840 [3:22:57<29:43:57, 6.80s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2091/17840 [3:22:57<29:43:57, 6.80s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2091/17840 [3:22:57<29:43:57, 6.80s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:04,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:04,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5639, 'learning_rate': 9.35332541567696e-05, 'epoch': 2.35} +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:04,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:04,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:04,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2093/17840 [3:23:11<30:06:03, 6.88s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:14,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:14,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:23:18<30:09:22, 6.89s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2094/17840 [3:23:18<30:09:22, 6.89s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1038, 'learning_rate': 9.352137767220903e-05, 'epoch': 2.35} + 12%|████████▌ | 2094/17840 [3:23:18<30:09:22, 6.89s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:24,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:24,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7852, 'learning_rate': 9.351543942992874e-05, 'epoch': 2.35} +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:24,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:24,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:24,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2096/17840 [3:23:32<29:55:43, 6.84s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:34,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:34,951 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:23:39<29:48:15, 6.82s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2097/17840 [3:23:39<29:48:15, 6.82s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9661, 'learning_rate': 9.350356294536817e-05, 'epoch': 2.35} +[WARNING|modeling_utils.py:388] 2022-03-18 12:21:43,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:23:45<29:38:18, 6.78s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:23:45<29:38:18, 6.78s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6546, 'learning_rate': 9.34976247030879e-05, 'epoch': 2.35} + 12%|████████▌ | 2098/17840 [3:23:45<29:38:18, 6.78s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:23:45<29:38:18, 6.78s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2098/17840 [3:23:45<29:38:18, 6.78s/it]g-point operations will not be computed-18 12:19:34,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:23:52<29:31:49, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:23:52<29:31:49, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2099/17840 [3:23:52<29:31:49, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:23:59<30:09:19, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2100/17840 [3:23:59<30:09:19, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6603, 'learning_rate': 9.348574821852733e-05, 'epoch': 2.35} + 12%|████████▌ | 2100/17840 [3:23:59<30:09:19, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:05,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:05,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6869, 'learning_rate': 9.347980997624703e-05, 'epoch': 2.36} +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:05,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:05,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:05,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2102/17840 [3:24:12<29:32:25, 6.76s/it]g-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:15,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:15,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:15,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2103/17840 [3:24:19<29:16:54, 6.70s/it]g-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2103/17840 [3:24:19<29:16:54, 6.70s/it]g-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:23,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2104/17840 [3:24:26<29:01:18, 6.64s/it]g-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2104/17840 [3:24:26<29:01:18, 6.64s/it]g-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5729, 'learning_rate': 9.346199524940618e-05, 'epoch': 2.36} + 12%|████████▌ | 2104/17840 [3:24:26<29:01:18, 6.64s/it]g-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:31,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:31,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6509, 'learning_rate': 9.34560570071259e-05, 'epoch': 2.36} +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:31,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:38,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:38,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6432, 'learning_rate': 9.345011876484561e-05, 'epoch': 2.36} +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:38,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:38,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:38,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:21:53,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2107/17840 [3:24:45<28:23:55, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2107/17840 [3:24:45<28:23:55, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2107/17840 [3:24:45<28:23:55, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▌ | 2107/17840 [3:24:45<28:23:55, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2108/17840 [3:24:51<28:09:14, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:54,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:54,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:22:54,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2109/17840 [3:24:57<27:53:33, 6.38s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:00,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:00,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:00,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2110/17840 [3:25:04<27:46:04, 6.36s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:06,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:06,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:06,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2111/17840 [3:25:10<27:39:17, 6.33s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:12,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:12,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:12,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2112/17840 [3:25:16<27:25:13, 6.28s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:18,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:18,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2113/17840 [3:25:22<27:10:52, 6.22s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2113/17840 [3:25:22<27:10:52, 6.22s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:24,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:24,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2114/17840 [3:25:28<26:56:56, 6.17s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2114/17840 [3:25:28<26:56:56, 6.17s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7802, 'learning_rate': 9.340261282660333e-05, 'epoch': 2.37} +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:32,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:32,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2115/17840 [3:25:34<26:43:44, 6.12s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:37,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:37,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:37,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2116/17840 [3:25:40<26:36:12, 6.09s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:43,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:43,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:43,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2117/17840 [3:25:46<26:24:04, 6.04s/it]g-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:48,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:48,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:48,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:22:46,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2118/17840 [3:25:52<26:02:24, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2118/17840 [3:25:52<26:02:24, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:57,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:23:57,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5834, 'learning_rate': 9.33729216152019e-05, 'epoch': 2.38} +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:01,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2120/17840 [3:26:03<25:10:21, 5.76s/it]g-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2120/17840 [3:26:03<25:10:21, 5.76s/it]g-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:05,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:05,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:05,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2121/17840 [3:26:09<24:49:44, 5.69s/it]g-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:11,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:13,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:13,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7444, 'learning_rate': 9.335510688836105e-05, 'epoch': 2.38} +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:17,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:17,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2123/17840 [3:26:19<23:43:07, 5.43s/it]g-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:21,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:23,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:23,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.3908, 'learning_rate': 9.334323040380048e-05, 'epoch': 2.38} +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:27,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:27,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:23:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2125/17840 [3:26:29<22:52:37, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2125/17840 [3:26:29<22:52:37, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:33,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:33,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:35,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:37,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:37,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:39,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:41,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:41,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:42,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:42,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:46,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:47,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:47,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:50,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:50,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:51,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:51,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:53,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:53,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:56,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:56,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:56,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:24:56,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:01,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:01,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:01,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:04,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:04,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:08,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:12,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:12,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9395, 'learning_rate': 9.327197149643706e-05, 'epoch': 2.39} +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:15,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:15,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2137/17840 [3:27:20<25:21:51, 5.81s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▋ | 2137/17840 [3:27:20<25:21:51, 5.81s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5977, 'learning_rate': 9.326603325415676e-05, 'epoch': 2.4} + 12%|████████▋ | 2137/17840 [3:27:20<25:21:51, 5.81s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:26,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:26,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8314, 'learning_rate': 9.32600950118765e-05, 'epoch': 2.4} +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:26,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:26,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:26,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:27:34<28:15:28, 6.48s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2139/17840 [3:27:34<28:15:28, 6.48s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:39,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2140/17840 [3:27:41<29:05:23, 6.67s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2140/17840 [3:27:41<29:05:23, 6.67s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6866, 'learning_rate': 9.324821852731592e-05, 'epoch': 2.4} + 12%|████████▊ | 2140/17840 [3:27:41<29:05:23, 6.67s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2140/17840 [3:27:41<29:05:23, 6.67s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:27:48<29:35:55, 6.79s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2141/17840 [3:27:48<29:35:55, 6.79s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9056, 'learning_rate': 9.324228028503563e-05, 'epoch': 2.4} +[WARNING|modeling_utils.py:388] 2022-03-18 12:25:53,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2142/17840 [3:27:55<29:57:45, 6.87s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2142/17840 [3:27:55<29:57:45, 6.87s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1795, 'learning_rate': 9.323634204275535e-05, 'epoch': 2.4} + 12%|████████▊ | 2142/17840 [3:27:55<29:57:45, 6.87s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2142/17840 [3:27:55<29:57:45, 6.87s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2143/17840 [3:28:02<30:08:17, 6.91s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2143/17840 [3:28:02<30:08:17, 6.91s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:05,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:05,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2144/17840 [3:28:09<30:12:06, 6.93s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2144/17840 [3:28:09<30:12:06, 6.93s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6335, 'learning_rate': 9.322446555819478e-05, 'epoch': 2.4} + 12%|████████▊ | 2144/17840 [3:28:09<30:12:06, 6.93s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:15,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:15,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.598, 'learning_rate': 9.32185273159145e-05, 'epoch': 2.4} +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:15,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:15,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2146/17840 [3:28:23<30:08:33, 6.91s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2146/17840 [3:28:23<30:08:33, 6.91s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8772, 'learning_rate': 9.32125890736342e-05, 'epoch': 2.41} + 12%|████████▊ | 2146/17840 [3:28:23<30:08:33, 6.91s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:29,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:29,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7888, 'learning_rate': 9.320665083135393e-05, 'epoch': 2.41} +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:29,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:29,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:28:37<29:59:45, 6.88s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2148/17840 [3:28:37<29:59:45, 6.88s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:39,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:39,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2149/17840 [3:28:44<29:54:02, 6.86s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2149/17840 [3:28:44<29:54:02, 6.86s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7804, 'learning_rate': 9.319477434679335e-05, 'epoch': 2.41} +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:48,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:48,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:48,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7514, 'learning_rate': 9.318883610451306e-05, 'epoch': 2.41} +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:48,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:48,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:26:48,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2151/17840 [3:28:58<30:08:37, 6.92s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:00,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:00,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:00,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2152/17840 [3:29:04<29:45:34, 6.83s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2152/17840 [3:29:04<29:45:34, 6.83s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:09,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2153/17840 [3:29:11<29:26:47, 6.76s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2153/17840 [3:29:11<29:26:47, 6.76s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7306, 'learning_rate': 9.317102137767222e-05, 'epoch': 2.41} + 12%|████████▊ | 2153/17840 [3:29:11<29:26:47, 6.76s/it]g-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:17,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:17,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7306, 'learning_rate': 9.316508313539193e-05, 'epoch': 2.41} +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:17,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:17,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:17,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:24:30,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2155/17840 [3:29:24<28:55:18, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2155/17840 [3:29:24<28:55:18, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2155/17840 [3:29:24<28:55:18, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2155/17840 [3:29:24<28:55:18, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2156/17840 [3:29:30<28:39:13, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:33,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:33,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:33,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2157/17840 [3:29:37<28:25:50, 6.53s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2157/17840 [3:29:37<28:25:50, 6.53s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:41,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:41,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2158/17840 [3:29:43<28:16:20, 6.49s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2158/17840 [3:29:43<28:16:20, 6.49s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:47,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:47,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2159/17840 [3:29:49<28:00:37, 6.43s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2159/17840 [3:29:49<28:00:37, 6.43s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:27:54,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:29:56<28:00:09, 6.43s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2160/17840 [3:29:56<28:00:09, 6.43s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7073, 'learning_rate': 9.312945368171022e-05, 'epoch': 2.42} + 12%|████████▊ | 2160/17840 [3:29:56<28:00:09, 6.43s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:01,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:01,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7339, 'learning_rate': 9.312351543942993e-05, 'epoch': 2.42} +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:01,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:08,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:08,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5027, 'learning_rate': 9.311757719714965e-05, 'epoch': 2.42} +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:08,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:14,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:14,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7102, 'learning_rate': 9.311163895486936e-05, 'epoch': 2.42} +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:18,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2164/17840 [3:30:20<26:54:52, 6.18s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2164/17840 [3:30:20<26:54:52, 6.18s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6952, 'learning_rate': 9.310570071258908e-05, 'epoch': 2.43} +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:24,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2165/17840 [3:30:26<26:40:30, 6.13s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2165/17840 [3:30:26<26:40:30, 6.13s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7162, 'learning_rate': 9.30997624703088e-05, 'epoch': 2.43} +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:30,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2166/17840 [3:30:32<26:22:43, 6.06s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2166/17840 [3:30:32<26:22:43, 6.06s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.516, 'learning_rate': 9.30938242280285e-05, 'epoch': 2.43} +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:36,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:36,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2167/17840 [3:30:38<26:12:45, 6.02s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:40,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:40,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:40,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▊ | 2168/17840 [3:30:44<25:56:16, 5.96s/it]g-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:46,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:46,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:46,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:27:25,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2169/17840 [3:30:50<25:35:38, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2169/17840 [3:30:50<25:35:38, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:55,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:55,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6698, 'learning_rate': 9.307007125890736e-05, 'epoch': 2.43} +[WARNING|modeling_utils.py:388] 2022-03-18 12:28:59,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2171/17840 [3:31:01<24:57:52, 5.74s/it]g-point operations will not be computed-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2171/17840 [3:31:01<24:57:52, 5.74s/it]g-point operations will not be computed-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:03,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:28:50,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2172/17840 [3:31:06<24:29:53, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2172/17840 [3:31:06<24:29:53, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:11,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:11,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6894, 'learning_rate': 9.305225653206652e-05, 'epoch': 2.44} +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:15,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:15,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2174/17840 [3:31:17<23:23:02, 5.37s/it]g-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:18,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:21,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:21,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6725, 'learning_rate': 9.304631828978623e-05, 'epoch': 2.44} +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:25,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:25,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:07,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2176/17840 [3:31:27<22:22:45, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:27,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:29,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:27,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:29,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:27,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2177/17840 [3:31:31<21:19:34, 4.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:31,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:33,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:31,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:33,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:31,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2178/17840 [3:31:35<20:06:56, 4.62s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:35,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:37,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:35,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:37,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:35,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2179/17840 [3:31:38<18:44:17, 4.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:39,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2180/17840 [3:31:42<17:16:47, 3.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:42,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2180/17840 [3:31:42<17:16:47, 3.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:42,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:43,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:42,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:43,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:42,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:46,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:44,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:46,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:44,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2182/17840 [3:31:47<14:10:40, 3.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:47,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2182/17840 [3:31:47<14:10:40, 3.26s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:47,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2183/17840 [3:31:49<12:47:50, 2.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:49,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2183/17840 [3:31:49<12:47:50, 2.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:49,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:31:51<11:28:30, 2.64s/it]g-point operations will not be computed-18 12:29:49,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:31:51<11:28:30, 2.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2184/17840 [3:31:51<11:28:30, 2.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:29:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:56,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:29:56,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:29:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:31:59<18:05:18, 4.16s/it]g-point operations will not be computed-18 12:29:52,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2185/17840 [3:31:59<18:05:18, 4.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:30:00,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:30:04,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:00,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:32:06<22:21:30, 5.14s/it]g-point operations will not be computed-18 12:30:00,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:32:06<22:21:30, 5.14s/it]g-point operations will not be computed-18 12:30:00,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:32:06<22:21:30, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:32:06<22:21:30, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2186/17840 [3:32:06<22:21:30, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2187/17840 [3:32:13<25:06:03, 5.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2187/17840 [3:32:13<25:06:03, 5.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9603, 'learning_rate': 9.29750593824228e-05, 'epoch': 2.45} +[WARNING|modeling_utils.py:388] 2022-03-18 12:30:18,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:32:21<26:57:23, 6.20s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:32:21<26:57:23, 6.20s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7107, 'learning_rate': 9.296912114014252e-05, 'epoch': 2.45} + 12%|████████▉ | 2188/17840 [3:32:21<26:57:23, 6.20s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:32:21<26:57:23, 6.20s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2188/17840 [3:32:21<26:57:23, 6.20s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2189/17840 [3:32:28<28:09:51, 6.48s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2189/17840 [3:32:28<28:09:51, 6.48s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:30:32,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:32:35<29:02:20, 6.68s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:32:35<29:02:20, 6.68s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6108, 'learning_rate': 9.295724465558195e-05, 'epoch': 2.46} + 12%|████████▉ | 2190/17840 [3:32:35<29:02:20, 6.68s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2190/17840 [3:32:35<29:02:20, 6.68s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2191/17840 [3:32:42<29:28:32, 6.78s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2191/17840 [3:32:42<29:28:32, 6.78s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:30:45,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:30:45,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:32:49<29:49:57, 6.86s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:32:49<29:49:57, 6.86s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8916, 'learning_rate': 9.294536817102139e-05, 'epoch': 2.46} + 12%|████████▉ | 2192/17840 [3:32:49<29:49:57, 6.86s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:32:49<29:49:57, 6.86s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2192/17840 [3:32:49<29:49:57, 6.86s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2193/17840 [3:32:56<30:04:58, 6.92s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:30:59,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:30:59,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:33:03<30:14:17, 6.96s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2194/17840 [3:33:03<30:14:17, 6.96s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1626, 'learning_rate': 9.293349168646082e-05, 'epoch': 2.46} + 12%|████████▉ | 2194/17840 [3:33:03<30:14:17, 6.96s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:09,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:09,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7999, 'learning_rate': 9.292755344418053e-05, 'epoch': 2.46} +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:09,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:09,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2196/17840 [3:33:17<29:57:49, 6.90s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2196/17840 [3:33:17<29:57:49, 6.90s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:19,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:19,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2197/17840 [3:33:24<29:50:28, 6.87s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2197/17840 [3:33:24<29:50:28, 6.87s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6005, 'learning_rate': 9.291567695961995e-05, 'epoch': 2.46} + 12%|████████▉ | 2197/17840 [3:33:24<29:50:28, 6.87s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:30,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:30,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5182, 'learning_rate': 9.290973871733967e-05, 'epoch': 2.46} +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:30,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:30,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2199/17840 [3:33:37<29:37:48, 6.82s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|████████▉ | 2199/17840 [3:33:37<29:37:48, 6.82s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:40,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:31:40,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2200/17840 [3:33:44<30:07:04, 6.93s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2200/17840 [3:33:44<30:07:04, 6.93s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7991, 'learning_rate': 9.28978622327791e-05, 'epoch': 2.47} + 12%|█████████ | 2200/17840 [3:33:44<30:07:04, 6.93s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2200/17840 [3:33:44<30:07:04, 6.93s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2200/17840 [3:33:44<30:07:04, 6.93s/it]g-point operations will not be computed-18 12:30:07,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2201/17840 [3:33:51<29:52:15, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2201/17840 [3:33:51<29:52:15, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2201/17840 [3:33:51<29:52:15, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2202/17840 [3:33:58<29:31:39, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2202/17840 [3:33:58<29:31:39, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:00,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2203/17840 [3:34:04<29:16:45, 6.74s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2203/17840 [3:34:04<29:16:45, 6.74s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6029, 'learning_rate': 9.288004750593825e-05, 'epoch': 2.47} + 12%|█████████ | 2203/17840 [3:34:04<29:16:45, 6.74s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:10,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:10,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5806, 'learning_rate': 9.287410926365795e-05, 'epoch': 2.47} +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:10,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:17,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:17,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8428, 'learning_rate': 9.286817102137768e-05, 'epoch': 2.47} +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:17,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:17,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:17,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2206/17840 [3:34:24<28:47:17, 6.63s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:27,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2207/17840 [3:34:31<28:41:37, 6.61s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2207/17840 [3:34:31<28:41:37, 6.61s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:35,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:35,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2208/17840 [3:34:37<28:26:02, 6.55s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2208/17840 [3:34:37<28:26:02, 6.55s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:41,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:41,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2209/17840 [3:34:43<28:19:04, 6.52s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2209/17840 [3:34:43<28:19:04, 6.52s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:47,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:47,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2210/17840 [3:34:50<28:02:13, 6.46s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2210/17840 [3:34:50<28:02:13, 6.46s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2210/17840 [3:34:50<28:02:13, 6.46s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:55,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:32:55,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9506, 'learning_rate': 9.283254156769596e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:00,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2212/17840 [3:35:02<27:27:54, 6.33s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2212/17840 [3:35:02<27:27:54, 6.33s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4871, 'learning_rate': 9.282660332541569e-05, 'epoch': 2.48} + 12%|█████████ | 2212/17840 [3:35:02<27:27:54, 6.33s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:08,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:08,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6678, 'learning_rate': 9.28206650831354e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:08,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:14,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:14,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7967, 'learning_rate': 9.281472684085512e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:14,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:20,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:20,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8285, 'learning_rate': 9.280878859857482e-05, 'epoch': 2.48} +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:20,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:20,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:26,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:26,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:30,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:30,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2217/17840 [3:35:32<26:08:42, 6.02s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2217/17840 [3:35:32<26:08:42, 6.02s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:36,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:36,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2218/17840 [3:35:38<25:40:56, 5.92s/it]g-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:40,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:43,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:43,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4843, 'learning_rate': 9.278503562945369e-05, 'epoch': 2.49} +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:43,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:48,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:48,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:51,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:51,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:51,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:31:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2221/17840 [3:35:54<24:26:19, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:33:55,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2221/17840 [3:35:54<24:26:19, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:33:55,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:59,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:33:55,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:33:59,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:33:55,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5613, 'learning_rate': 9.276722090261283e-05, 'epoch': 2.49} +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:03,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:33:55,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2223/17840 [3:36:05<23:11:20, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:05,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2223/17840 [3:36:05<23:11:20, 5.35s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:05,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8562, 'learning_rate': 9.276128266033255e-05, 'epoch': 2.49} +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:09,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:05,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:09,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:05,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:11,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:05,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:11,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:05,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:11,475 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:05,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2225/17840 [3:36:14<22:06:11, 5.10s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:15,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:17,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:15,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:17,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:15,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2226/17840 [3:36:19<20:53:18, 4.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:19,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:21,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:19,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:21,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:19,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2227/17840 [3:36:22<19:37:22, 4.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:23,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2228/17840 [3:36:26<18:23:29, 4.24s/it]g-point operations will not be computed-18 12:34:23,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2228/17840 [3:36:26<18:23:29, 4.24s/it]g-point operations will not be computed-18 12:34:23,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:28,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:26,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2229/17840 [3:36:29<17:05:47, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:29,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 2229/17840 [3:36:29<17:05:47, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:29,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 2230/17840 [3:36:32<15:49:27, 3.65s/it]g-point operations will not be computed-18 12:34:29,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 2230/17840 [3:36:32<15:49:27, 3.65s/it]g-point operations will not be computed-18 12:34:29,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:34,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:32,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:34,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:32,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2231/17840 [3:36:35<14:42:29, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:35,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2232/17840 [3:36:37<13:32:00, 3.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:37,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2232/17840 [3:36:37<13:32:00, 3.12s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:37,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2233/17840 [3:36:40<12:29:06, 2.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:40,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2233/17840 [3:36:40<12:29:06, 2.88s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:40,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2234/17840 [3:36:42<11:18:48, 2.61s/it]g-point operations will not be computed-18 12:34:40,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2234/17840 [3:36:42<11:18:48, 2.61s/it]g-point operations will not be computed-18 12:34:40,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2234/17840 [3:36:42<11:18:48, 2.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:43,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2234/17840 [3:36:42<11:18:48, 2.61s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:43,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:47,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:43,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2235/17840 [3:36:49<18:00:19, 4.15s/it]g-point operations will not be computed-18 12:34:43,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2235/17840 [3:36:49<18:00:19, 4.15s/it]g-point operations will not be computed-18 12:34:43,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2235/17840 [3:36:49<18:00:19, 4.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:51,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2235/17840 [3:36:49<18:00:19, 4.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:51,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:54,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:51,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:34:54,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:51,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2236/17840 [3:36:57<22:19:10, 5.15s/it]g-point operations will not be computed-18 12:34:51,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2236/17840 [3:36:57<22:19:10, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:02,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:37:04<25:14:18, 5.82s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:37:04<25:14:18, 5.82s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0617, 'learning_rate': 9.267814726840855e-05, 'epoch': 2.51} + 13%|█████████▏ | 2237/17840 [3:37:04<25:14:18, 5.82s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2237/17840 [3:37:04<25:14:18, 5.82s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:37:12<26:57:50, 6.22s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2238/17840 [3:37:12<26:57:50, 6.22s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.951, 'learning_rate': 9.267220902612827e-05, 'epoch': 2.51} +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:16,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2239/17840 [3:37:19<28:11:16, 6.50s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2239/17840 [3:37:19<28:11:16, 6.50s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5654, 'learning_rate': 9.266627078384799e-05, 'epoch': 2.51} + 13%|█████████▏ | 2239/17840 [3:37:19<28:11:16, 6.50s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2239/17840 [3:37:19<28:11:16, 6.50s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:37:26<29:06:10, 6.72s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2240/17840 [3:37:26<29:06:10, 6.72s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6129, 'learning_rate': 9.26603325415677e-05, 'epoch': 2.51} +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:30,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2241/17840 [3:37:33<29:35:41, 6.83s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2241/17840 [3:37:33<29:35:41, 6.83s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9319, 'learning_rate': 9.265439429928742e-05, 'epoch': 2.51} + 13%|█████████▏ | 2241/17840 [3:37:33<29:35:41, 6.83s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2241/17840 [3:37:33<29:35:41, 6.83s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2242/17840 [3:37:40<29:50:59, 6.89s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2242/17840 [3:37:40<29:50:59, 6.89s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:43,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:43,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2243/17840 [3:37:47<30:04:31, 6.94s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2243/17840 [3:37:47<30:04:31, 6.94s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7415, 'learning_rate': 9.264251781472685e-05, 'epoch': 2.51} + 13%|█████████▏ | 2243/17840 [3:37:47<30:04:31, 6.94s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:53,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:53,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8762, 'learning_rate': 9.263657957244655e-05, 'epoch': 2.52} +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:53,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:53,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:35:53,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2245/17840 [3:38:01<30:13:26, 6.98s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2245/17840 [3:38:01<30:13:26, 6.98s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:05,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:05,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:38:08<30:07:23, 6.95s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:38:08<30:07:23, 6.95s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:38:08<30:07:23, 6.95s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:38:08<30:07:23, 6.95s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2246/17840 [3:38:08<30:07:23, 6.95s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2247/17840 [3:38:15<29:55:03, 6.91s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:17,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:17,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:17,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:38:22<29:48:47, 6.88s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:38:22<29:48:47, 6.88s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:38:22<29:48:47, 6.88s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2248/17840 [3:38:22<29:48:47, 6.88s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:28,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:28,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:28,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:28,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:28,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2250/17840 [3:38:36<30:13:52, 6.98s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2250/17840 [3:38:36<30:13:52, 6.98s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:40,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:40,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2251/17840 [3:38:42<29:59:17, 6.93s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2251/17840 [3:38:42<29:59:17, 6.93s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2251/17840 [3:38:42<29:59:17, 6.93s/it]g-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:48,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:48,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6692, 'learning_rate': 9.258907363420429e-05, 'epoch': 2.52} +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:48,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:48,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:36:48,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:34:58,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2253/17840 [3:38:56<29:19:54, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2253/17840 [3:38:56<29:19:54, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2253/17840 [3:38:56<29:19:54, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2253/17840 [3:38:56<29:19:54, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2254/17840 [3:39:02<29:05:18, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:05,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:05,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2255/17840 [3:39:09<28:51:07, 6.66s/it]g-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2255/17840 [3:39:09<28:51:07, 6.66s/it]g-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6314, 'learning_rate': 9.257125890736342e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:13,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:39:15<28:39:58, 6.62s/it]g-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2256/17840 [3:39:15<28:39:58, 6.62s/it]g-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8076, 'learning_rate': 9.256532066508314e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:19,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2257/17840 [3:39:22<28:23:50, 6.56s/it]g-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▏ | 2257/17840 [3:39:22<28:23:50, 6.56s/it]g-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6699, 'learning_rate': 9.255938242280285e-05, 'epoch': 2.53} + 13%|█████████▏ | 2257/17840 [3:39:22<28:23:50, 6.56s/it]g-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:27,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:27,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7028, 'learning_rate': 9.255344418052257e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:27,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:34,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:34,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7749, 'learning_rate': 9.254750593824229e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:34,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:40,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:40,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7409, 'learning_rate': 9.2541567695962e-05, 'epoch': 2.53} +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:40,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:40,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:40,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:36:57,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2261/17840 [3:39:47<27:35:43, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:37:48,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2261/17840 [3:39:47<27:35:43, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:37:48,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2261/17840 [3:39:47<27:35:43, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:37:48,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2261/17840 [3:39:47<27:35:43, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:37:48,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2262/17840 [3:39:53<27:15:40, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:37:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2262/17840 [3:39:53<27:15:40, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:37:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:59,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:37:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:59,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:37:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5334, 'learning_rate': 9.252375296912114e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:59,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:37:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:59,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:37:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:37:59,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:37:54,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2264/17840 [3:40:05<26:42:03, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2264/17840 [3:40:05<26:42:03, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:11,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:11,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6536, 'learning_rate': 9.251187648456057e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:11,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:16,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:16,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5705, 'learning_rate': 9.250593824228029e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:21,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2267/17840 [3:40:23<25:47:38, 5.96s/it]g-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2267/17840 [3:40:23<25:47:38, 5.96s/it]g-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7498, 'learning_rate': 9.250000000000001e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:26,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2268/17840 [3:40:29<25:25:14, 5.88s/it]g-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2268/17840 [3:40:29<25:25:14, 5.88s/it]g-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:31,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:31,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:06,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2269/17840 [3:40:34<25:09:35, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2269/17840 [3:40:34<25:09:35, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.775, 'learning_rate': 9.248812351543944e-05, 'epoch': 2.54} +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:39,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:39,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:39,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:43,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:43,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2271/17840 [3:40:45<24:29:11, 5.66s/it]g-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:47,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:47,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:47,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:35,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2272/17840 [3:40:51<24:04:34, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:38:51,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2272/17840 [3:40:51<24:04:34, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:38:51,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2272/17840 [3:40:51<24:04:34, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:38:51,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:55,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:51,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:58,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:51,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:58,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:51,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:38:58,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:38:51,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2274/17840 [3:41:01<22:55:29, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:04,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:04,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2275/17840 [3:41:06<22:39:54, 5.24s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:08,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:08,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:10,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:12,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:12,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:14,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:16,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:16,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:17,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:19,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:19,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:21,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:24,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:24,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:25,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:25,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:28,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:28,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:29,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:29,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:31,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:31,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:33,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:33,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:37,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:37,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:37,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:41,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:41,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:45,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:45,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:45,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:49,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:52,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:52,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:39:52,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:41:57<24:53:45, 5.76s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:41:57<24:53:45, 5.76s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:41:57<24:53:45, 5.76s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:41:57<24:53:45, 5.76s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2287/17840 [3:41:57<24:53:45, 5.76s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2288/17840 [3:42:04<26:46:23, 6.20s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2288/17840 [3:42:04<26:46:23, 6.20s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2288/17840 [3:42:04<26:46:23, 6.20s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:10,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:10,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5915, 'learning_rate': 9.236935866983374e-05, 'epoch': 2.57} +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:10,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:10,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:10,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2290/17840 [3:42:18<28:50:59, 6.68s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2290/17840 [3:42:18<28:50:59, 6.68s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:23,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2291/17840 [3:42:25<29:21:24, 6.80s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2291/17840 [3:42:25<29:21:24, 6.80s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7008, 'learning_rate': 9.235748218527317e-05, 'epoch': 2.57} + 13%|█████████▎ | 2291/17840 [3:42:25<29:21:24, 6.80s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2291/17840 [3:42:25<29:21:24, 6.80s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▎ | 2291/17840 [3:42:25<29:21:24, 6.80s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2292/17840 [3:42:32<29:33:31, 6.84s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2292/17840 [3:42:32<29:33:31, 6.84s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:37,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:37,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2293/17840 [3:42:39<29:41:08, 6.87s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2293/17840 [3:42:39<29:41:08, 6.87s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2293/17840 [3:42:39<29:41:08, 6.87s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:45,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:45,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8142, 'learning_rate': 9.233966745843231e-05, 'epoch': 2.57} +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:45,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:45,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:45,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2295/17840 [3:42:53<29:41:33, 6.88s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:55,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:40:55,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2296/17840 [3:43:00<29:35:23, 6.85s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2296/17840 [3:43:00<29:35:23, 6.85s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6087, 'learning_rate': 9.232779097387174e-05, 'epoch': 2.57} +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:04,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:43:06<29:29:30, 6.83s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:43:06<29:29:30, 6.83s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0833, 'learning_rate': 9.232185273159145e-05, 'epoch': 2.58} + 13%|█████████▍ | 2297/17840 [3:43:06<29:29:30, 6.83s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:43:06<29:29:30, 6.83s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2297/17840 [3:43:06<29:29:30, 6.83s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2298/17840 [3:43:13<29:19:23, 6.79s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:16,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:16,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:16,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2299/17840 [3:43:20<29:12:38, 6.77s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2299/17840 [3:43:20<29:12:38, 6.77s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2299/17840 [3:43:20<29:12:38, 6.77s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:26,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:26,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5618, 'learning_rate': 9.230403800475061e-05, 'epoch': 2.58} +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:26,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:33,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:33,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8228, 'learning_rate': 9.229809976247031e-05, 'epoch': 2.58} +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:36,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:36,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2302/17840 [3:43:40<29:05:42, 6.74s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2302/17840 [3:43:40<29:05:42, 6.74s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:43,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:43,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2303/17840 [3:43:47<28:58:59, 6.72s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2303/17840 [3:43:47<28:58:59, 6.72s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7972, 'learning_rate': 9.228622327790974e-05, 'epoch': 2.58} + 13%|█████████▍ | 2303/17840 [3:43:47<28:58:59, 6.72s/it]g-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:53,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:53,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6798, 'learning_rate': 9.228028503562945e-05, 'epoch': 2.58} +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:53,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:53,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:41:53,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:39:01,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2305/17840 [3:44:00<28:36:16, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2305/17840 [3:44:00<28:36:16, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2305/17840 [3:44:00<28:36:16, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2305/17840 [3:44:00<28:36:16, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2306/17840 [3:44:06<28:22:52, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2306/17840 [3:44:06<28:22:52, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2306/17840 [3:44:06<28:22:52, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2307/17840 [3:44:13<28:13:49, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2307/17840 [3:44:13<28:13:49, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:15,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:15,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2308/17840 [3:44:19<28:07:09, 6.52s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2308/17840 [3:44:19<28:07:09, 6.52s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8912, 'learning_rate': 9.225653206650832e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:23,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2309/17840 [3:44:26<27:55:39, 6.47s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2309/17840 [3:44:26<27:55:39, 6.47s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6232, 'learning_rate': 9.225059382422804e-05, 'epoch': 2.59} + 13%|█████████▍ | 2309/17840 [3:44:26<27:55:39, 6.47s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:31,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:31,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6131, 'learning_rate': 9.224465558194774e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:31,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:37,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:37,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4199, 'learning_rate': 9.223871733966746e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:37,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:37,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:44,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:44,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:44,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:50,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:50,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.476, 'learning_rate': 9.222684085510689e-05, 'epoch': 2.59} +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:50,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:50,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:56,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:56,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:42:56,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:02,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:02,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7362, 'learning_rate': 9.221496437054632e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:02,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:02,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:08,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:08,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:13,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:13,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████���███▍ | 2317/17840 [3:45:15<26:20:03, 6.11s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2317/17840 [3:45:15<26:20:03, 6.11s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2318/17840 [3:45:21<25:59:40, 6.03s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2318/17840 [3:45:21<25:59:40, 6.03s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:24,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:24,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2319/17840 [3:45:27<25:40:01, 5.95s/it]g-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:29,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:29,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:29,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:42:07,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2320/17840 [3:45:32<25:16:30, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▍ | 2320/17840 [3:45:32<25:16:30, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:37,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:37,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9326, 'learning_rate': 9.217933491686461e-05, 'epoch': 2.6} +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:41,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:41,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2322/17840 [3:45:43<24:21:08, 5.65s/it]g-point operations will not be computed-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2322/17840 [3:45:43<24:21:08, 5.65s/it]g-point operations will not be computed-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:46,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:46,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:33,384 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2323/17840 [3:45:48<23:47:48, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2323/17840 [3:45:48<23:47:48, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2323/17840 [3:45:48<23:47:48, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:53,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:53,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:56,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:43:56,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2325/17840 [3:45:59<23:17:04, 5.40s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:00,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:00,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:03,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:05,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:05,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:07,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:09,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:09,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:13,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:13,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:14,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:17,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:17,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:19,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:19,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:22,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:22,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:24,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:24,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:26,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:26,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:27,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:27,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:35,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:35,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:38,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:42,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:42,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.809, 'learning_rate': 9.209026128266034e-05, 'epoch': 2.62} +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:46,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:46,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:44:46,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:46:50<24:55:26, 5.79s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:46:50<24:55:26, 5.79s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:46:50<24:55:26, 5.79s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:46:50<24:55:26, 5.79s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2337/17840 [3:46:50<24:55:26, 5.79s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2338/17840 [3:46:57<26:51:27, 6.24s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:00,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:00,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:47:05<28:06:13, 6.53s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:47:05<28:06:13, 6.53s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4156, 'learning_rate': 9.207244655581948e-05, 'epoch': 2.62} + 13%|█████████▌ | 2339/17840 [3:47:05<28:06:13, 6.53s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:47:05<28:06:13, 6.53s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2339/17840 [3:47:05<28:06:13, 6.53s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2340/17840 [3:47:12<28:52:59, 6.71s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:15,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:15,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:47:19<29:22:40, 6.82s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:47:19<29:22:40, 6.82s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7373, 'learning_rate': 9.206057007125891e-05, 'epoch': 2.62} + 13%|█████████▌ | 2341/17840 [3:47:19<29:22:40, 6.82s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:47:19<29:22:40, 6.82s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2341/17840 [3:47:19<29:22:40, 6.82s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2342/17840 [3:47:26<29:43:03, 6.90s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:29,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:29,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2343/17840 [3:47:33<29:59:44, 6.97s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2343/17840 [3:47:33<29:59:44, 6.97s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.628, 'learning_rate': 9.204869358669834e-05, 'epoch': 2.63} + 13%|█████████▌ | 2343/17840 [3:47:33<29:59:44, 6.97s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2343/17840 [3:47:33<29:59:44, 6.97s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2343/17840 [3:47:33<29:59:44, 6.97s/it]g-point operations will not be computed-18 12:43:49,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:47:40<30:04:54, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:47:40<30:04:54, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:47:40<30:04:54, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2344/17840 [3:47:40<30:04:54, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2345/17840 [3:47:47<30:00:58, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2345/17840 [3:47:47<30:00:58, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2345/17840 [3:47:47<30:00:58, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:53,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:53,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6512, 'learning_rate': 9.203087885985749e-05, 'epoch': 2.63} +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:53,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:53,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:45:53,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2347/17840 [3:48:01<29:48:12, 6.93s/it]g-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:03,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:03,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2348/17840 [3:48:08<29:41:20, 6.90s/it]g-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2348/17840 [3:48:08<29:41:20, 6.90s/it]g-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.732, 'learning_rate': 9.201900237529691e-05, 'epoch': 2.63} + 13%|█████████▌ | 2348/17840 [3:48:08<29:41:20, 6.90s/it]g-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:14,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:14,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6781, 'learning_rate': 9.201306413301663e-05, 'epoch': 2.63} +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:14,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:14,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:14,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2350/17840 [3:48:22<30:01:47, 6.98s/it]g-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2350/17840 [3:48:22<30:01:47, 6.98s/it]g-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2350/17840 [3:48:22<30:01:47, 6.98s/it]g-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:28,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:28,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5898, 'learning_rate': 9.200118764845606e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:28,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:28,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:28,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:45:41,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2352/17840 [3:48:35<29:18:52, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2352/17840 [3:48:35<29:18:52, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2352/17840 [3:48:35<29:18:52, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▌ | 2352/17840 [3:48:35<29:18:52, 6.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2353/17840 [3:48:42<29:02:35, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:44,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:44,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2354/17840 [3:48:48<28:50:22, 6.70s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2354/17840 [3:48:48<28:50:22, 6.70s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4868, 'learning_rate': 9.198337292161521e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:52,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:48:55<28:35:32, 6.65s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2355/17840 [3:48:55<28:35:32, 6.65s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4536, 'learning_rate': 9.197743467933492e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-18 12:46:59,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2356/17840 [3:49:01<28:22:14, 6.60s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2356/17840 [3:49:01<28:22:14, 6.60s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7206, 'learning_rate': 9.197149643705464e-05, 'epoch': 2.64} + 13%|█████████▋ | 2356/17840 [3:49:01<28:22:14, 6.60s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:07,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:07,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4878, 'learning_rate': 9.196555819477434e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:07,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:13,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:13,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5959, 'learning_rate': 9.195961995249406e-05, 'epoch': 2.64} +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:13,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:13,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:13,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2359/17840 [3:49:20<27:46:37, 6.46s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:23,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:23,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2360/17840 [3:49:27<27:33:39, 6.41s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2360/17840 [3:49:27<27:33:39, 6.41s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:29,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:29,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2361/17840 [3:49:33<27:21:03, 6.36s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2361/17840 [3:49:33<27:21:03, 6.36s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:35,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:35,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2362/17840 [3:49:39<27:09:34, 6.32s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2362/17840 [3:49:39<27:09:34, 6.32s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:41,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:41,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2363/17840 [3:49:45<26:51:24, 6.25s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2363/17840 [3:49:45<26:51:24, 6.25s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:47,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:47,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2364/17840 [3:49:51<26:41:51, 6.21s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2364/17840 [3:49:51<26:41:51, 6.21s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:54,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:47:54,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2365/17840 [3:49:57<26:34:16, 6.18s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2365/17840 [3:49:57<26:34:16, 6.18s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:00,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:00,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:00,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2366/17840 [3:50:03<26:20:59, 6.13s/it]g-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:06,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:06,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:06,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:46:36,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2367/17840 [3:50:09<26:02:22, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2367/17840 [3:50:09<26:02:22, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2367/17840 [3:50:09<26:02:22, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:14,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:14,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:18,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:18,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2369/17840 [3:50:21<25:09:54, 5.86s/it]g-point operations will not be computed-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:23,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:23,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:23,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:10,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2370/17840 [3:50:26<24:50:51, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2370/17840 [3:50:26<24:50:51, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2370/17840 [3:50:26<24:50:51, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:31,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:31,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:35,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:35,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2372/17840 [3:50:37<23:53:54, 5.56s/it]g-point operations will not be computed-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:39,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:39,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:39,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:27,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2373/17840 [3:50:42<23:17:29, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:45,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:45,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2374/17840 [3:50:47<22:40:32, 5.28s/it]g-point operations will not be computed-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:49,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:51,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:51,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5067, 'learning_rate': 9.185866983372921e-05, 'epoch': 2.66} +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:55,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:55,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:43,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2376/17840 [3:50:57<21:29:51, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:48:57,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:59,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:57,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:48:59,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:48:57,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2377/17840 [3:51:01<20:16:42, 4.72s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:01,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:49:03,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:01,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:49:03,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:01,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2378/17840 [3:51:04<19:00:52, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:05,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2378/17840 [3:51:04<19:00:52, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:05,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2379/17840 [3:51:08<17:48:53, 4.15s/it]g-point operations will not be computed-18 12:49:05,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2379/17840 [3:51:08<17:48:53, 4.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:08,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2379/17840 [3:51:08<17:48:53, 4.15s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:08,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2380/17840 [3:51:11<16:30:29, 3.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2380/17840 [3:51:11<16:30:29, 3.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2381/17840 [3:51:14<15:24:48, 3.59s/it]g-point operations will not be computed-18 12:49:11,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:49:15,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:14,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:49:15,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:14,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2382/17840 [3:51:17<14:05:05, 3.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:16,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▋ | 2382/17840 [3:51:17<14:05:05, 3.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:16,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2383/17840 [3:51:19<12:43:37, 2.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:19,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2383/17840 [3:51:19<12:43:37, 2.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:19,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2384/17840 [3:51:21<11:26:21, 2.66s/it]g-point operations will not be computed-18 12:49:19,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2384/17840 [3:51:21<11:26:21, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:22,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2384/17840 [3:51:21<11:26:21, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:22,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2385/17840 [3:51:28<17:46:31, 4.14s/it]g-point operations will not be computed-18 12:49:22,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2385/17840 [3:51:28<17:46:31, 4.14s/it]g-point operations will not be computed-18 12:49:22,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2385/17840 [3:51:28<17:46:31, 4.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:30,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2385/17840 [3:51:28<17:46:31, 4.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:30,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:49:33,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:30,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:49:33,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:30,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2386/17840 [3:51:36<21:56:23, 5.11s/it]g-point operations will not be computed-18 12:49:30,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2386/17840 [3:51:36<21:56:23, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2386/17840 [3:51:36<21:56:23, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2386/17840 [3:51:36<21:56:23, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2386/17840 [3:51:36<21:56:23, 5.11s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2387/17840 [3:51:43<24:48:35, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2387/17840 [3:51:43<24:48:35, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:49:48,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [3:51:50<26:40:20, 6.21s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [3:51:50<26:40:20, 6.21s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6761, 'learning_rate': 9.178147268408551e-05, 'epoch': 2.68} + 13%|█████████▊ | 2388/17840 [3:51:50<26:40:20, 6.21s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [3:51:50<26:40:20, 6.21s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2388/17840 [3:51:50<26:40:20, 6.21s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2389/17840 [3:51:58<27:57:18, 6.51s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2389/17840 [3:51:58<27:57:18, 6.51s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:02,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [3:52:05<28:50:09, 6.72s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [3:52:05<28:50:09, 6.72s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6654, 'learning_rate': 9.176959619952494e-05, 'epoch': 2.68} + 13%|█████████▊ | 2390/17840 [3:52:05<28:50:09, 6.72s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [3:52:05<28:50:09, 6.72s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2390/17840 [3:52:05<28:50:09, 6.72s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2391/17840 [3:52:12<29:16:26, 6.82s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2391/17840 [3:52:12<29:16:26, 6.82s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2391/17840 [3:52:12<29:16:26, 6.82s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:18,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:18,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8756, 'learning_rate': 9.175771971496438e-05, 'epoch': 2.68} +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:18,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:18,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:18,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2393/17840 [3:52:26<29:43:23, 6.93s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:29,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:29,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:29,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [3:52:33<29:40:13, 6.92s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [3:52:33<29:40:13, 6.92s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2394/17840 [3:52:33<29:40:13, 6.92s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:39,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:39,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6315, 'learning_rate': 9.173990498812351e-05, 'epoch': 2.68} +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:39,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:39,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:39,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2396/17840 [3:52:46<29:34:48, 6.90s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:49,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:49,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2397/17840 [3:52:53<29:30:12, 6.88s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2397/17840 [3:52:53<29:30:12, 6.88s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4974, 'learning_rate': 9.172802850356294e-05, 'epoch': 2.69} + 13%|█████████▊ | 2397/17840 [3:52:53<29:30:12, 6.88s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:59,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:59,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6956, 'learning_rate': 9.172209026128266e-05, 'epoch': 2.69} +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:59,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:59,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:50:59,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2399/17840 [3:53:07<29:12:27, 6.81s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:09,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:09,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2400/17840 [3:53:14<29:49:05, 6.95s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2400/17840 [3:53:14<29:49:05, 6.95s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.578, 'learning_rate': 9.17102137767221e-05, 'epoch': 2.69} + 13%|█████████▊ | 2400/17840 [3:53:14<29:49:05, 6.95s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2400/17840 [3:53:14<29:49:05, 6.95s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2400/17840 [3:53:14<29:49:05, 6.95s/it]g-point operations will not be computed-18 12:49:37,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2401/17840 [3:53:21<29:34:24, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2401/17840 [3:53:21<29:34:24, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2401/17840 [3:53:21<29:34:24, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2402/17840 [3:53:28<29:21:06, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2402/17840 [3:53:28<29:21:06, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5609, 'learning_rate': 9.169833729216153e-05, 'epoch': 2.69} +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:32,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [3:53:34<29:12:57, 6.81s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2403/17840 [3:53:34<29:12:57, 6.81s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9196, 'learning_rate': 9.169239904988124e-05, 'epoch': 2.69} + 13%|█████████▊ | 2403/17840 [3:53:34<29:12:57, 6.81s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:40,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:40,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5914, 'learning_rate': 9.168646080760096e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:40,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:40,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:40,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2405/17840 [3:53:48<28:43:40, 6.70s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:50,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:50,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2406/17840 [3:53:54<28:25:42, 6.63s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2406/17840 [3:53:54<28:25:42, 6.63s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:57,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:51:57,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2407/17840 [3:54:00<28:13:31, 6.58s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2407/17840 [3:54:00<28:13:31, 6.58s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7359, 'learning_rate': 9.16686460807601e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:05,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2408/17840 [3:54:07<28:01:20, 6.54s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|█████████▊ | 2408/17840 [3:54:07<28:01:20, 6.54s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6156, 'learning_rate': 9.166270783847981e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:11,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██���██████▊ | 2409/17840 [3:54:13<27:47:33, 6.48s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▊ | 2409/17840 [3:54:13<27:47:33, 6.48s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5857, 'learning_rate': 9.165676959619953e-05, 'epoch': 2.7} + 14%|█████████▊ | 2409/17840 [3:54:13<27:47:33, 6.48s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:19,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:19,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4645, 'learning_rate': 9.165083135391924e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:19,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:25,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:25,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8167, 'learning_rate': 9.164489311163896e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:25,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:31,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:31,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.529, 'learning_rate': 9.163895486935868e-05, 'epoch': 2.7} +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:31,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:38,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:38,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5985, 'learning_rate': 9.16330166270784e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:38,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:44,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:44,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7157, 'learning_rate': 9.16270783847981e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:44,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:50,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:50,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8243, 'learning_rate': 9.162114014251781e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:50,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:50,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:56,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:52:56,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:00,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:00,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2417/17840 [3:55:02<25:54:40, 6.05s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2417/17840 [3:55:02<25:54:40, 6.05s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:06,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:06,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2418/17840 [3:55:08<25:40:14, 5.99s/it]g-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:10,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:10,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:10,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:51:22,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2419/17840 [3:55:14<25:16:45, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2419/17840 [3:55:14<25:16:45, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:19,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:19,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8756, 'learning_rate': 9.15914489311164e-05, 'epoch': 2.71} +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:23,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:23,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2421/17840 [3:55:25<24:22:58, 5.69s/it]g-point operations will not be computed-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2421/17840 [3:55:25<24:22:58, 5.69s/it]g-point operations will not be computed-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:28,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:28,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:15,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2422/17840 [3:55:30<23:54:02, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2422/17840 [3:55:30<23:54:02, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2422/17840 [3:55:30<23:54:02, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:35,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:35,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:38,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:38,978 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2424/17840 [3:55:40<22:55:54, 5.36s/it]g-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:42,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:45,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:45,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:48,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:48,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:48,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:31,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2426/17840 [3:55:51<22:05:28, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:53:51,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:53,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:51,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:53,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:51,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2427/17840 [3:55:55<20:51:36, 4.87s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:53:55,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:57,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:55,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:53:57,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:55,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2428/17840 [3:55:59<19:36:03, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:53:59,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:54:01,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:59,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:54:01,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:53:59,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2429/17840 [3:56:02<18:19:57, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:02,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2429/17840 [3:56:02<18:19:57, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:02,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2430/17840 [3:56:06<17:04:36, 3.99s/it]g-point operations will not be computed-18 12:54:02,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:54:07,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:06,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:54:07,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:06,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2431/17840 [3:56:09<15:47:11, 3.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:09,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2431/17840 [3:56:09<15:47:11, 3.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:09,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2432/17840 [3:56:11<14:28:20, 3.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:11,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2432/17840 [3:56:11<14:28:20, 3.38s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:11,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2433/17840 [3:56:13<13:00:01, 3.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:13,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2433/17840 [3:56:13<13:00:01, 3.04s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:13,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2434/17840 [3:56:15<11:38:19, 2.72s/it]g-point operations will not be computed-18 12:54:13,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2434/17840 [3:56:15<11:38:19, 2.72s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:17,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2434/17840 [3:56:15<11:38:19, 2.72s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:17,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:54:20,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:17,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:54:20,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:17,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2435/17840 [3:56:23<18:02:56, 4.22s/it]g-point operations will not be computed-18 12:54:17,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2435/17840 [3:56:23<18:02:56, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:24,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2435/17840 [3:56:23<18:02:56, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:24,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:54:28,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:24,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:54:28,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:24,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [3:56:31<22:15:10, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [3:56:31<22:15:10, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [3:56:31<22:15:10, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2436/17840 [3:56:31<22:15:10, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2437/17840 [3:56:38<24:56:53, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2437/17840 [3:56:38<24:56:53, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2437/17840 [3:56:38<24:56:53, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2437/17840 [3:56:38<24:56:53, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2437/17840 [3:56:38<24:56:53, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:32,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [3:56:45<26:44:37, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [3:56:45<26:44:37, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2438/17840 [3:56:45<26:44:37, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [3:56:52<27:50:10, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [3:56:52<27:50:10, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5741, 'learning_rate': 9.147862232779098e-05, 'epoch': 2.73} + 14%|█████████▉ | 2439/17840 [3:56:52<27:50:10, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [3:56:52<27:50:10, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2439/17840 [3:56:52<27:50:10, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2440/17840 [3:56:59<28:37:50, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:02,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:02,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:02,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [3:57:06<29:01:17, 6.78s/it]g-point operations will not be computed-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [3:57:06<29:01:17, 6.78s/it]g-point operations will not be computed-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [3:57:06<29:01:17, 6.78s/it]g-point operations will not be computed-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [3:57:06<29:01:17, 6.78s/it]g-point operations will not be computed-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2441/17840 [3:57:06<29:01:17, 6.78s/it]g-point operations will not be computed-18 12:54:46,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2442/17840 [3:57:14<29:27:05, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2442/17840 [3:57:14<29:27:05, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2442/17840 [3:57:14<29:27:05, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2442/17840 [3:57:14<29:27:05, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [3:57:21<29:35:51, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [3:57:21<29:35:51, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|█████████▉ | 2443/17840 [3:57:21<29:35:51, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:27,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:27,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6559, 'learning_rate': 9.144893111638955e-05, 'epoch': 2.74} +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:27,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:27,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:27,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2445/17840 [3:57:35<29:45:21, 6.96s/it]g-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:37,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:37,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2446/17840 [3:57:41<29:38:11, 6.93s/it]g-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2446/17840 [3:57:41<29:38:11, 6.93s/it]g-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6714, 'learning_rate': 9.143705463182898e-05, 'epoch': 2.74} + 14%|██████████ | 2446/17840 [3:57:41<29:38:11, 6.93s/it]g-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:47,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:47,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6693, 'learning_rate': 9.14311163895487e-05, 'epoch': 2.74} +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:47,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:47,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2448/17840 [3:57:55<29:20:20, 6.86s/it]g-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2448/17840 [3:57:55<29:20:20, 6.86s/it]g-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:58,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:55:58,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2449/17840 [3:58:02<29:08:02, 6.81s/it]g-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2449/17840 [3:58:02<29:08:02, 6.81s/it]g-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7014, 'learning_rate': 9.141923990498813e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:06,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:06,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:55:15,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [3:58:09<29:34:59, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [3:58:09<29:34:59, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2450/17840 [3:58:09<29:34:59, 6.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [3:58:16<29:18:22, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2451/17840 [3:58:16<29:18:22, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:18,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:18,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2452/17840 [3:58:22<28:54:44, 6.76s/it]g-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2452/17840 [3:58:22<28:54:44, 6.76s/it]g-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7593, 'learning_rate': 9.140142517814728e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:26,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2453/17840 [3:58:29<28:44:28, 6.72s/it]g-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2453/17840 [3:58:29<28:44:28, 6.72s/it]g-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6579, 'learning_rate': 9.1395486935867e-05, 'epoch': 2.75} + 14%|██████████ | 2453/17840 [3:58:29<28:44:28, 6.72s/it]g-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:35,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:35,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7646, 'learning_rate': 9.13895486935867e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:35,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6021, 'learning_rate': 9.138361045130642e-05, 'epoch': 2.75} +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:41,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:10,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2456/17840 [3:58:48<28:07:40, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2456/17840 [3:58:48<28:07:40, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.6161, 'learning_rate': 9.137767220902613e-05, 'epoch': 2.75} + 14%|██████████ | 2456/17840 [3:58:48<28:07:40, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2457/17840 [3:58:55<27:52:56, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2457/17840 [3:58:55<27:52:56, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:57,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:56:57,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2458/17840 [3:59:01<27:39:50, 6.47s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2458/17840 [3:59:01<27:39:50, 6.47s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:03,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:03,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:03,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2459/17840 [3:59:07<27:26:35, 6.42s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2459/17840 [3:59:07<27:26:35, 6.42s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:11,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:11,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2460/17840 [3:59:14<27:11:41, 6.37s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2460/17840 [3:59:14<27:11:41, 6.37s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:18,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:18,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2461/17840 [3:59:20<27:00:01, 6.32s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2461/17840 [3:59:20<27:00:01, 6.32s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:24,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:24,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [3:59:26<26:49:06, 6.28s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [3:59:26<26:49:06, 6.28s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [3:59:26<26:49:06, 6.28s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2462/17840 [3:59:26<26:49:06, 6.28s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:31,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:31,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:31,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:31,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:38,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:38,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:38,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:38,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:44,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:44,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:48,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:48,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [3:59:50<26:11:56, 6.13s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2466/17840 [3:59:50<26:11:56, 6.13s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:54,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:54,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2467/17840 [3:59:56<25:52:34, 6.06s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:58,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:58,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:57:58,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2468/17840 [4:00:02<25:27:36, 5.96s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:04,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:04,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:04,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2469/17840 [4:00:08<25:01:42, 5.86s/it]g-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:10,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:12,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:12,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4609, 'learning_rate': 9.129453681710213e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:12,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:12,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:18,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:18,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:22,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:22,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:56:49,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2472/17840 [4:00:24<23:48:25, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:25,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2472/17840 [4:00:24<23:48:25, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:25,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:28,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:25,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:28,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:25,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5873, 'learning_rate': 9.12767220902613e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:32,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:25,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:32,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:25,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2474/17840 [4:00:34<22:39:23, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:35,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████ | 2474/17840 [4:00:34<22:39:23, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:35,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:39,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:35,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:39,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:35,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4941, 'learning_rate': 9.126484560570072e-05, 'epoch': 2.77} +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:42,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:35,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:42,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:35,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2476/17840 [4:00:44<21:40:06, 5.08s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:44,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:46,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:44,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:46,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:44,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2477/17840 [4:00:48<20:34:46, 4.82s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:48,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:50,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:48,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:50,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:48,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2478/17840 [4:00:52<19:23:02, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:52,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2478/17840 [4:00:52<19:23:02, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:52,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2479/17840 [4:00:56<18:09:14, 4.25s/it]g-point operations will not be computed-18 12:58:52,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:57,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:56,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:58:57,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:58:56,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2480/17840 [4:00:59<16:44:42, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:59,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2480/17840 [4:00:59<16:44:42, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:58:59,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2481/17840 [4:01:02<15:14:20, 3.57s/it]g-point operations will not be computed-18 12:58:59,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2482/17840 [4:01:04<13:51:11, 3.25s/it]g-point operations will not be computed-18 12:59:01,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2482/17840 [4:01:04<13:51:11, 3.25s/it]g-point operations will not be computed-18 12:59:01,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:05,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:04,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:05,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:04,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:01:08<11:14:50, 2.64s/it]g-point operations will not be computed-18 12:59:06,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:01:08<11:14:50, 2.64s/it]g-point operations will not be computed-18 12:59:06,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:01:08<11:14:50, 2.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:09,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2484/17840 [4:01:08<11:14:50, 2.64s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:09,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:13,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:09,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:13,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:09,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:01:16<17:38:43, 4.14s/it]g-point operations will not be computed-18 12:59:09,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:01:16<17:38:43, 4.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:17,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2485/17840 [4:01:16<17:38:43, 4.14s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:17,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:21,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:17,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:21,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:17,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:01:23<21:53:49, 5.13s/it]g-point operations will not be computed-18 12:59:17,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:01:23<21:53:49, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:01:23<21:53:49, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:01:23<21:53:49, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2486/17840 [4:01:23<21:53:49, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:24,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2487/17840 [4:01:31<24:46:57, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2487/17840 [4:01:31<24:46:57, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2487/17840 [4:01:31<24:46:57, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2487/17840 [4:01:31<24:46:57, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:01:38<26:37:13, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:01:38<26:37:13, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:01:38<26:37:13, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:01:38<26:37:13, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2488/17840 [4:01:38<26:37:13, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2489/17840 [4:01:45<27:54:26, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:48,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:48,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 12:59:48,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:01:52<28:37:32, 6.71s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:01:52<28:37:32, 6.71s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:01:52<28:37:32, 6.71s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:01:52<28:37:32, 6.71s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2490/17840 [4:01:52<28:37:32, 6.71s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2491/17840 [4:01:59<29:11:36, 6.85s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:02,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:02,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2492/17840 [4:02:07<29:31:40, 6.93s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2492/17840 [4:02:07<29:31:40, 6.93s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7063, 'learning_rate': 9.116389548693587e-05, 'epoch': 2.79} + 14%|██████████▏ | 2492/17840 [4:02:07<29:31:40, 6.93s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2492/17840 [4:02:07<29:31:40, 6.93s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2492/17840 [4:02:07<29:31:40, 6.93s/it]g-point operations will not be computed-18 12:59:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2493/17840 [4:02:14<29:37:08, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2493/17840 [4:02:14<29:37:08, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2493/17840 [4:02:14<29:37:08, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2493/17840 [4:02:14<29:37:08, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2494/17840 [4:02:21<29:39:19, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2494/17840 [4:02:21<29:39:19, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2494/17840 [4:02:21<29:39:19, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:27,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:27,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.4199, 'learning_rate': 9.114608076009502e-05, 'epoch': 2.8} +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:27,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:27,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:27,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2496/17840 [4:02:34<29:30:41, 6.92s/it]g-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2496/17840 [4:02:34<29:30:41, 6.92s/it]g-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:39,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2497/17840 [4:02:41<29:24:10, 6.90s/it]g-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2497/17840 [4:02:41<29:24:10, 6.90s/it]g-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.8041, 'learning_rate': 9.113420427553445e-05, 'epoch': 2.8} + 14%|██████████▏ | 2497/17840 [4:02:41<29:24:10, 6.90s/it]g-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:47,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:47,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.5056, 'learning_rate': 9.112826603325417e-05, 'epoch': 2.8} +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:47,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:47,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-18 13:00:47,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-18 13:00:15,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2499/17840 [4:02:55<28:55:47, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:56,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2499/17840 [4:02:55<28:55:47, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:56,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▏ | 2499/17840 [4:02:55<28:55:47, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-18 13:00:56,023 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2366] 2022-03-18 13:01:01,647 >> Num examples = 2642 | 2500/17840 [4:03:02<29:29:06, 6.92s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|trainer.py:2366] 2022-03-18 13:01:01,647 >> Num examples = 2642 | 2500/17840 [4:03:02<29:29:06, 6.92s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +{'loss': 3.4828, 'learning_rate': 9.11163895486936e-05, 'epoch': 2.8} +[INFO|trainer.py:2366] 2022-03-18 13:01:01,647 >> Num examples = 2642 | 2500/17840 [4:03:02<29:29:06, 6.92s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|▊ | 3/331 [00:04<09:07, 1.67s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 1%|█ | 4/331 [00:07<10:26, 1.92s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▎ | 5/331 [00:10<13:10, 2.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▌ | 6/331 [00:13<15:04, 2.78s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▊ | 7/331 [00:16<14:45, 2.73s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|██ | 8/331 [00:19<15:30, 2.88s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▎ | 9/331 [00:23<16:46, 3.13s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▍ | 10/331 [00:27<18:51, 3.53s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▋ | 11/331 [00:30<17:48, 3.34s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|██▉ | 12/331 [00:33<17:10, 3.23s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▏ | 13/331 [00:36<16:40, 3.14s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▍ | 14/331 [00:39<16:21, 3.10s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▋ | 15/331 [00:44<19:15, 3.66s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▉ | 16/331 [00:49<21:29, 4.09s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▏ | 17/331 [00:54<21:56, 4.19s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▍ | 18/331 [00:56<18:50, 3.61s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▋ | 19/331 [00:59<18:23, 3.54s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▉ | 20/331 [01:02<16:19, 3.15s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|█████▏ | 21/331 [01:06<17:40, 3.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▍ | 22/331 [01:11<20:08, 3.91s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▋ | 23/331 [01:16<22:57, 4.47s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▉ | 24/331 [01:22<24:55, 4.87s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▏ | 25/331 [01:26<23:32, 4.62s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▍ | 26/331 [01:29<20:53, 4.11s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▋ | 27/331 [01:34<21:13, 4.19s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▉ | 28/331 [01:37<20:13, 4.01s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▏ | 29/331 [01:41<19:15, 3.82s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▍ | 30/331 [01:43<17:46, 3.54s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▋ | 31/331 [01:46<16:29, 3.30s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|███████▉ | 32/331 [01:49<15:57, 3.20s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▏ | 33/331 [01:52<16:03, 3.23s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▍ | 34/331 [01:56<16:03, 3.25s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▋ | 35/331 [01:59<16:35, 3.36s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▉ | 36/331 [02:04<18:12, 3.70s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▏ | 37/331 [02:09<19:53, 4.06s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▍ | 38/331 [02:13<20:26, 4.18s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▋ | 39/331 [02:18<20:38, 4.24s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▉ | 40/331 [02:20<17:49, 3.68s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|██████████▏ | 41/331 [02:23<16:15, 3.36s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▍ | 42/331 [02:28<18:26, 3.83s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▋ | 43/331 [02:32<19:59, 4.16s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▉ | 44/331 [02:38<21:09, 4.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▏ | 45/331 [02:41<19:15, 4.04s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▍ | 46/331 [02:43<16:47, 3.53s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▋ | 47/331 [02:45<14:54, 3.15s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|███████████▉ | 48/331 [02:49<15:37, 3.31s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▏ | 49/331 [02:53<17:11, 3.66s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▍ | 50/331 [02:57<17:06, 3.65s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▋ | 51/331 [03:01<17:45, 3.81s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|████████████▉ | 52/331 [03:04<16:30, 3.55s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▏ | 53/331 [03:08<16:36, 3.58s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▍ | 54/331 [03:10<15:03, 3.26s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▋ | 55/331 [03:15<17:34, 3.82s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▊ | 56/331 [03:19<17:10, 3.75s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|██████████████ | 57/331 [03:22<16:19, 3.58s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▎ | 58/331 [03:27<17:29, 3.84s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▌ | 59/331 [03:29<15:40, 3.46s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▊ | 60/331 [03:32<15:00, 3.32s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|███████████████ | 61/331 [03:36<16:05, 3.58s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▎ | 62/331 [03:40<15:30, 3.46s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▌ | 63/331 [03:45<17:58, 4.02s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▊ | 64/331 [03:48<16:46, 3.77s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████ | 65/331 [03:51<16:09, 3.64s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▎ | 66/331 [03:57<18:59, 4.30s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▌ | 67/331 [04:03<20:18, 4.62s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|████████████████▊ | 68/331 [04:07<20:26, 4.66s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████ | 69/331 [04:12<19:41, 4.51s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▎ | 70/331 [04:16<19:21, 4.45s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▌ | 71/331 [04:21<19:50, 4.58s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|█████████████████▊ | 72/331 [04:25<19:47, 4.59s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████ | 73/331 [04:29<18:40, 4.34s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████▎ | 74/331 [04:33<18:18, 4.28s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▌ | 75/331 [04:38<19:07, 4.48s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▊ | 76/331 [04:42<17:34, 4.14s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|███████████████████ | 77/331 [04:45<16:52, 3.99s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▎ | 78/331 [04:48<15:36, 3.70s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▌ | 79/331 [04:51<14:39, 3.49s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▌ | 79/331 [04:51<14:39, 3.49s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▌ | 79/331 [04:51<14:39, 3.49s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|████████████████████ | 81/331 [04:59<15:23, 3.69s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▎ | 82/331 [05:02<14:53, 3.59s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▌ | 83/331 [05:06<15:42, 3.80s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▊ | 84/331 [05:12<17:46, 4.32s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▊ | 84/331 [05:12<17:46, 4.32s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▊ | 84/331 [05:12<17:46, 4.32s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▎ | 86/331 [05:20<17:01, 4.17s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▌ | 87/331 [05:23<16:15, 4.00s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|█████████████████████▊ | 88/331 [05:27<15:28, 3.82s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████ | 89/331 [05:29<13:37, 3.38s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▎ | 90/331 [05:31<12:30, 3.11s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▌ | 91/331 [05:36<13:51, 3.47s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|██████████████████████▊ | 92/331 [05:38<12:16, 3.08s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████ | 93/331 [05:41<12:37, 3.18s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████▎ | 94/331 [05:45<13:13, 3.35s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▌ | 95/331 [05:49<13:26, 3.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▊ | 96/331 [05:52<13:41, 3.49s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|████████████████████████ | 97/331 [05:55<12:44, 3.27s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▎ | 98/331 [05:59<13:39, 3.52s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▌ | 99/331 [06:03<13:39, 3.53s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▍ | 100/331 [06:05<12:36, 3.28s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▋ | 101/331 [06:09<12:29, 3.26s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▉ | 102/331 [06:14<14:30, 3.80s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▏ | 103/331 [06:17<13:17, 3.50s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▍ | 104/331 [06:20<13:03, 3.45s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▋ | 105/331 [06:23<13:03, 3.47s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▉ | 106/331 [06:27<13:08, 3.50s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|██████████████████████████▏ | 107/331 [06:29<11:35, 3.10s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▍ | 108/331 [06:32<11:12, 3.02s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▋ | 109/331 [06:35<11:10, 3.02s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▉ | 110/331 [06:39<12:26, 3.38s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▏ | 111/331 [06:43<12:40, 3.46s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▍ | 112/331 [06:46<12:46, 3.50s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▋ | 113/331 [06:49<11:35, 3.19s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▉ | 114/331 [06:52<11:56, 3.30s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▏ | 115/331 [06:56<12:05, 3.36s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▍ | 116/331 [07:00<12:42, 3.55s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▋ | 117/331 [07:04<12:42, 3.56s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|████████████████████████████▉ | 118/331 [07:07<12:02, 3.39s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████ | 119/331 [07:10<11:55, 3.38s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████▎ | 120/331 [07:13<11:59, 3.41s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▌ | 121/331 [07:18<13:04, 3.74s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▊ | 122/331 [07:21<12:33, 3.60s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████ | 123/331 [07:26<14:05, 4.06s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████▎ | 124/331 [07:30<13:44, 3.98s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▌ | 125/331 [07:35<14:59, 4.37s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▊ | 126/331 [07:40<15:05, 4.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|███████████████████████████████ | 127/331 [07:45<15:55, 4.68s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▎ | 128/331 [07:50<16:03, 4.75s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▌ | 129/331 [07:54<15:30, 4.60s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▊ | 130/331 [07:59<15:50, 4.73s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████ | 131/331 [08:05<16:17, 4.89s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▎ | 132/331 [08:08<15:00, 4.52s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▌ | 133/331 [08:11<13:26, 4.07s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▊ | 134/331 [08:15<12:43, 3.87s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████ | 135/331 [08:19<13:05, 4.01s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▎ | 136/331 [08:24<13:53, 4.27s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▌ | 137/331 [08:29<14:36, 4.52s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|█████████████████████████████████▊ | 138/331 [08:34<15:04, 4.69s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████ | 139/331 [08:36<12:30, 3.91s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████▎ | 140/331 [08:42<14:05, 4.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▌ | 141/331 [08:45<12:56, 4.09s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▋ | 142/331 [08:49<12:27, 3.96s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▉ | 143/331 [08:54<13:21, 4.26s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▏ | 144/331 [08:57<12:36, 4.05s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▍ | 145/331 [09:01<12:17, 3.97s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▋ | 146/331 [09:06<13:21, 4.33s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▉ | 147/331 [09:10<12:38, 4.12s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▏ | 148/331 [09:13<11:26, 3.75s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▍ | 149/331 [09:15<10:16, 3.39s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▋ | 150/331 [09:20<11:06, 3.68s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|███████���████████████████████████████▉ | 151/331 [09:23<10:49, 3.61s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▏ | 152/331 [09:26<09:51, 3.31s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▍ | 153/331 [09:29<09:32, 3.22s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▋ | 154/331 [09:33<10:31, 3.57s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▉ | 155/331 [09:38<11:33, 3.94s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▏ | 156/331 [09:43<12:19, 4.23s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▍ | 157/331 [09:48<13:05, 4.51s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▋ | 158/331 [09:53<13:20, 4.63s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▉ | 159/331 [09:58<13:15, 4.62s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|███████████████████████████████████████▏ | 160/331 [10:01<12:01, 4.22s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|��██████████████████████████████████████▍ | 161/331 [10:04<11:29, 4.06s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▋ | 162/331 [10:10<12:21, 4.39s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▉ | 163/331 [10:14<12:30, 4.46s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▉ | 163/331 [10:14<12:30, 4.46s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▉ | 163/331 [10:14<12:30, 4.46s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▍ | 165/331 [10:22<11:14, 4.06s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▌ | 166/331 [10:25<10:46, 3.92s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▊ | 167/331 [10:30<11:09, 4.08s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████ | 168/331 [10:33<10:10, 3.75s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▎ | 169/331 [10:37<10:31, 3.90s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▌ | 170/331 [10:40<09:38, 3.59s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|█████████████████████████████████████████▊ | 171/331 [10:43<09:32, 3.58s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████ | 172/331 [10:46<08:49, 3.33s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████▎ | 173/331 [10:50<09:16, 3.52s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|██████████████████████████████████████████▌ | 174/331 [10:53<08:40, 3.32s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|██████████████████████████████████████████▊ | 175/331 [10:57<08:56, 3.44s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████ | 176/331 [10:59<08:28, 3.28s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████▎ | 177/331 [11:04<09:19, 3.63s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▌ | 178/331 [11:09<10:23, 4.08s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▊ | 179/331 [11:14<11:12, 4.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|████████████████████████████████████████████ | 180/331 [11:18<10:54, 4.33s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▎ | 181/331 [11:23<10:44, 4.30s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▌ | 182/331 [11:25<09:21, 3.77s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▊ | 183/331 [11:27<08:10, 3.32s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████ | 184/331 [11:30<07:18, 2.98s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▎ | 185/331 [11:32<06:29, 2.67s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▌ | 186/331 [11:35<06:59, 2.89s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▊ | 187/331 [11:40<08:16, 3.45s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████ | 188/331 [11:43<08:16, 3.47s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████▎ | 189/331 [11:46<07:31, 3.18s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████▍ | 190/331 [11:48<06:59, 2.97s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▋ | 191/331 [11:51<06:53, 2.96s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▉ | 192/331 [11:54<06:30, 2.81s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|███████████████████████████████████████████████▏ | 193/331 [11:58<07:34, 3.29s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▍ | 194/331 [12:00<06:50, 3.00s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▋ | 195/331 [12:03<06:33, 2.89s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▉ | 196/331 [12:06<06:50, 3.04s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▏ | 197/331 [12:11<07:32, 3.38s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▍ | 198/331 [12:13<06:51, 3.10s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▋ | 199/331 [12:17<07:05, 3.23s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▉ | 200/331 [12:19<06:25, 2.94s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▏ | 201/331 [12:22<06:16, 2.89s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▍ | 202/331 [12:25<06:40, 3.10s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▋ | 203/331 [12:29<06:45, 3.17s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|█████████████████████████████████████████████████▉ | 204/331 [12:33<07:31, 3.55s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▏ | 205/331 [12:37<07:42, 3.67s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▍ | 206/331 [12:40<07:34, 3.64s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▋ | 207/331 [12:45<08:12, 3.98s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▉ | 208/331 [12:50<08:24, 4.10s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▏ | 209/331 [12:52<07:16, 3.58s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▍ | 210/331 [12:54<06:24, 3.18s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▋ | 211/331 [12:58<06:34, 3.29s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▉ | 212/331 [13:00<06:02, 3.05s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|████████████████████████████████████████████████████ | 213/331 [13:03<06:06, 3.11s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▎ | 214/331 [13:06<05:32, 2.84s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▌ | 215/331 [13:08<05:04, 2.63s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▊ | 216/331 [13:13<06:15, 3.27s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████ | 217/331 [13:16<06:11, 3.26s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▎ | 218/331 [13:20<06:47, 3.60s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▌ | 219/331 [13:24<06:38, 3.56s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▊ | 220/331 [13:26<06:08, 3.32s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████ | 221/331 [13:30<06:17, 3.43s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▎ | 222/331 [13:33<05:45, 3.17s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▌ | 223/331 [13:36<05:54, 3.28s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|██████████████████████████████████████████████████████▊ | 224/331 [13:40<05:59, 3.36s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████ | 225/331 [13:43<06:01, 3.41s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████▎ | 226/331 [13:48<06:37, 3.79s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▌ | 227/331 [13:51<06:24, 3.69s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▊ | 228/331 [13:55<06:05, 3.55s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████ | 229/331 [13:58<05:55, 3.49s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████▎ | 230/331 [14:01<05:37, 3.34s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████████████████████████████████████████████▌ | 231/331 [14:05<05:55, 3.56s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████████████████████████████████████████████▊ | 232/331 [14:08<05:44, 3.48s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|█████████████████████████████████████████████████████████ | 233/331 [14:13<06:04, 3.72s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▎ | 234/331 [14:15<05:31, 3.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▌ | 235/331 [14:18<05:09, 3.22s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▊ | 236/331 [14:24<06:15, 3.95s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|█████████████████████████████████████████████████████████▉ | 237/331 [14:29<06:43, 4.29s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▏ | 238/331 [14:33<06:36, 4.27s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▍ | 239/331 [14:37<06:34, 4.29s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▋ | 240/331 [14:42<06:47, 4.48s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▉ | 241/331 [14:47<06:58, 4.65s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▏ | 242/331 [14:52<07:01, 4.73s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▍ | 243/331 [14:57<06:52, 4.69s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▋ | 244/331 [15:02<07:03, 4.87s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▉ | 245/331 [15:06<06:41, 4.67s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|████████████████████████████████████████████████████████████▏ | 246/331 [15:12<07:05, 5.00s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▍ | 247/331 [15:16<06:41, 4.77s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▋ | 248/331 [15:20<05:59, 4.33s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▉ | 249/331 [15:22<05:11, 3.80s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▏ | 250/331 [15:25<04:45, 3.52s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▍ | 251/331 [15:29<04:54, 3.68s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▋ | 252/331 [15:32<04:28, 3.39s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▉ | 253/331 [15:36<04:50, 3.72s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▏ | 254/331 [15:40<04:37, 3.60s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▍ | 255/331 [15:44<04:52, 3.85s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▋ | 256/331 [15:48<04:36, 3.69s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|██████████████████████████████████████████████████████████████▉ | 257/331 [15:52<04:49, 3.91s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▏ | 258/331 [15:55<04:16, 3.51s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▍ | 259/331 [15:58<04:08, 3.46s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▋ | 260/331 [16:02<04:17, 3.63s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▊ | 261/331 [16:04<03:46, 3.24s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████ | 262/331 [16:08<03:46, 3.29s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████▎ | 263/331 [16:12<04:07, 3.64s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|██████████��█████████████████████████████████████████████████████▌ | 264/331 [16:15<03:50, 3.45s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [16:18<03:38, 3.32s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|█████████████████████████████████████████████████████████████████ | 266/331 [16:21<03:28, 3.21s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▎ | 267/331 [16:26<03:50, 3.60s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▌ | 268/331 [16:29<03:44, 3.56s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▊ | 269/331 [16:34<04:08, 4.01s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████ | 270/331 [16:38<04:00, 3.94s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▎ | 271/331 [16:43<04:13, 4.23s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▌ | 272/331 [16:46<03:53, 3.96s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [16:50<03:53, 4.02s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████ | 274/331 [16:55<04:08, 4.36s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▎ | 275/331 [17:00<04:07, 4.42s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▌ | 276/331 [17:03<03:40, 4.00s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|███████████████████████████████████████████████████████████████████▊ | 277/331 [17:07<03:28, 3.87s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████ | 278/331 [17:10<03:21, 3.79s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████▎ | 279/331 [17:16<03:47, 4.37s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▌ | 280/331 [17:20<03:34, 4.21s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▊ | 281/331 [17:25<03:42, 4.46s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████ | 282/331 [17:29<03:37, 4.43s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████▎ | 283/331 [17:34<03:42, 4.64s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▍ | 284/331 [17:40<03:47, 4.83s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▋ | 285/331 [17:45<03:47, 4.95s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▉ | 286/331 [17:50<03:45, 5.02s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▏ | 287/331 [17:56<03:50, 5.23s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▍ | 288/331 [18:01<03:44, 5.22s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [18:04<03:19, 4.74s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|██████████████████████████████████████████████████████████████████████▉ | 290/331 [18:08<02:57, 4.33s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▏ | 291/331 [18:11<02:37, 3.93s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▍ | 292/331 [18:14<02:26, 3.76s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▋ | 293/331 [18:18<02:22, 3.75s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▉ | 294/331 [18:21<02:07, 3.45s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▏ | 295/331 [18:24<01:58, 3.29s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▍ | 296/331 [18:26<01:48, 3.11s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▋ | 297/331 [18:32<02:07, 3.76s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▉ | 298/331 [18:37<02:20, 4.24s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [18:40<02:07, 4.00s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▍ | 300/331 [18:44<02:02, 3.96s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▋ | 301/331 [18:48<01:55, 3.85s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▉ | 302/331 [18:51<01:47, 3.70s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▏ | 303/331 [18:54<01:37, 3.47s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▍ | 304/331 [18:58<01:40, 3.71s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▋ | 305/331 [19:03<01:43, 3.96s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▉ | 306/331 [19:08<01:49, 4.36s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▏ | 307/331 [19:14<01:51, 4.66s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▎ | 308/331 [19:19<01:54, 4.96s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▌ | 309/331 [19:25<01:51, 5.08s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|███████████████████████████████████████████████████████████████████████████▊ | 310/331 [19:28<01:35, 4.55s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████ | 311/331 [19:32<01:31, 4.55s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████▎ | 312/331 [19:36<01:17, 4.10s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▌ | 313/331 [19:39<01:10, 3.94s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▊ | 314/331 [19:44<01:09, 4.09s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████ | 315/331 [19:48<01:08, 4.26s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████▎ | 316/331 [19:53<01:04, 4.30s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████��███████████████████████████████████████████████████████████████████▌ | 317/331 [19:58<01:04, 4.60s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████████████████████████████████████████████████████████████████████████▊ | 318/331 [20:01<00:54, 4.16s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|██████████████████████████████████████████████████████████████████████████████ | 319/331 [20:04<00:46, 3.83s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▎ | 320/331 [20:08<00:43, 3.94s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▌ | 321/331 [20:12<00:38, 3.87s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▊ | 322/331 [20:17<00:38, 4.24s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████ | 323/331 [20:21<00:32, 4.04s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [20:26<00:30, 4.35s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▌ | 325/331 [20:30<00:26, 4.38s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▊ | 326/331 [20:35<00:22, 4.44s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████ | 327/331 [20:39<00:17, 4.45s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████▎| 328/331 [20:44<00:13, 4.55s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████▌| 329/331 [20:48<00:08, 4.39s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +100%|████████████████████████████████████████████████████████████████████████████████▊| 330/331 [20:53<00:04, 4.71s/it][INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|configuration_utils.py:438] 2022-03-18 13:22:00,734 >> Configuration saved in ./checkpoint-2500/config.json [INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|configuration_utils.py:438] 2022-03-18 13:22:00,734 >> Configuration saved in ./checkpoint-2500/config.json [INFO|trainer.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/18/2022 13:22:00 - INFO - datasets.metric - Removing /home/sanchit_huggingface_co/.cache/huggingface/metrics/wer/default/default_experiment-1-0.arrow +[INFO|feature_extraction_utils.py:324] 2022-03-18 13:22:17,597 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-18 13:22:17,597 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-18 13:22:17,597 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-18 13:22:17,597 >> Configuration saved in ./checkpoint-2500/preprocessor_config.jsoner.py:560] 2022-03-18 13:01:01,641 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message.